diff --git a/.ci/azure/linux.yml b/.ci/azure/linux.yml index 493d492d04a885..bfed994a137547 100644 --- a/.ci/azure/linux.yml +++ b/.ci/azure/linux.yml @@ -33,7 +33,7 @@ jobs: INSTALL_DIR: $(WORK_DIR)/install_pkg INSTALL_TEST_DIR: $(INSTALL_DIR)/tests LAYER_TESTS_DIR: $(INSTALL_TEST_DIR)/layer_tests - SETUPVARS: $(INSTALL_DIR)/bin/setupvars.sh + SETUPVARS: $(INSTALL_DIR)/setupvars.sh steps: - script: | @@ -103,6 +103,7 @@ jobs: workingDirectory: $(WORK_DIR) displayName: 'Install dependencies' + # Should be after 'Install dependencies' because Git lfs is not installed - checkout: testdata clean: true lfs: true @@ -140,18 +141,18 @@ jobs: - script: cmake -DCMAKE_INSTALL_PREFIX=$(INSTALL_DIR) -P cmake_install.cmake workingDirectory: $(BUILD_DIR) displayName: 'Install' - + - task: CMake@1 inputs: cmakeArgs: > -GNinja $(REPO_DIR)/tests/layer_tests workingDirectory: $(BUILD_LAYER_TESTS_DIR) - + - script: ninja workingDirectory: $(BUILD_LAYER_TESTS_DIR) displayName: 'Build Layer Tests' - + - script: cmake -DCOMPONENT=tests -DCMAKE_INSTALL_PREFIX=$(INSTALL_DIR) -P cmake_install.cmake workingDirectory: $(BUILD_LAYER_TESTS_DIR) displayName: 'Install Layer Tests' @@ -166,18 +167,18 @@ jobs: cp -R $(REPO_DIR)/inference-engine/temp/opencv_4.5.2_ubuntu20/opencv/* $(INSTALL_DIR)/opencv/ workingDirectory: $(BUILD_DIR) displayName: 'Install tests' - + - script: ls -alR $(INSTALL_DIR) displayName: 'List install files' - - script: $(INSTALL_DIR)/deployment_tools/inference_engine/samples/cpp/build_samples.sh + - script: $(INSTALL_DIR)/samples/cpp/build_samples.sh workingDirectory: $(BUILD_SAMPLES_DIR) displayName: 'Build cpp samples' - - script: $(INSTALL_DIR)/deployment_tools/inference_engine/samples/c/build_samples.sh + - script: $(INSTALL_DIR)/samples/c/build_samples.sh workingDirectory: $(BUILD_SAMPLES_DIR) displayName: 'Build c samples' - + - script: rm -fr $(BUILD_DIR) displayName: 'Clean build dir' continueOnError: false @@ -188,8 +189,8 @@ jobs: continueOnError: false - script: | - export MO_ROOT=$(INSTALL_DIR)/deployment_tools/model_optimizer - . $(SETUPVARS) -pyver 3.8 && python3 -m pytest -s $(INSTALL_DIR)/deployment_tools/model_optimizer/unit_tests --junitxml=TEST-ModelOptimizer.xml + export MO_ROOT=$(INSTALL_DIR)/tools/model_optimizer + . $(SETUPVARS) -pyver 3.8 && python3 -m pytest -s $(INSTALL_DIR)/tools/model_optimizer/unit_tests --junitxml=TEST-ModelOptimizer.xml displayName: 'Model Optimizer UT' continueOnError: false @@ -253,11 +254,11 @@ jobs: . $(SETUPVARS) -pyver 3.8 && python3 -m pytest --junitxml=TEST-PythonAPI.xml displayName: 'Python API Tests' continueOnError: false - + - script: | . 
$(SETUPVARS) python3 -m pip install -r requirements.txt - export MO_ROOT=$(INSTALL_DIR)/deployment_tools/model_optimizer + export MO_ROOT=$(INSTALL_DIR)/tools/model_optimizer export PYTHONPATH=$(LAYER_TESTS_DIR):$PYTHONPATH python3 -m pytest tensorflow_tests/test_tf_Roll.py --ir_version=10 --junitxml=TEST-tf_Roll.xmlTEST workingDirectory: $(LAYER_TESTS_DIR) diff --git a/.ci/azure/linux_conditional_compilation.yml b/.ci/azure/linux_conditional_compilation.yml index a4063d2c9031f0..1a69b7c3dcd9a2 100644 --- a/.ci/azure/linux_conditional_compilation.yml +++ b/.ci/azure/linux_conditional_compilation.yml @@ -17,7 +17,7 @@ jobs: WORK_DIR: $(Pipeline.Workspace)/_w BUILD_DIR: $(WORK_DIR)/build INSTALL_DIR: $(WORK_DIR)/install_pkg - SETUPVARS: $(INSTALL_DIR)/bin/setupvars.sh + SETUPVARS: $(INSTALL_DIR)/setupvars.sh steps: - script: | diff --git a/.ci/azure/linux_ngraph_onnx.yml b/.ci/azure/linux_ngraph_onnx.yml index 5521d224630ad7..8218a0874cdd30 100644 --- a/.ci/azure/linux_ngraph_onnx.yml +++ b/.ci/azure/linux_ngraph_onnx.yml @@ -72,7 +72,7 @@ jobs: workingDirectory: $(WORK_DIR) displayName: 'Install dependencies' - - script: ngraph/python/tests/test_onnx/model_zoo_preprocess.sh -d $(MODELS_DIR)/models_data -o -s "$(ONNX_MODEL_ZOO_SHA)" + - script: runtime/bindings/python/tests/test_onnx/model_zoo_preprocess.sh -d $(MODELS_DIR)/models_data -o -s "$(ONNX_MODEL_ZOO_SHA)" displayName: 'Update models' condition: ne(variables['BUILD_TYPE'], 'Debug') diff --git a/.ci/azure/linux_onnxruntime.yml b/.ci/azure/linux_onnxruntime.yml index 932fb76d5cc8b9..ad5e630820ddbf 100644 --- a/.ci/azure/linux_onnxruntime.yml +++ b/.ci/azure/linux_onnxruntime.yml @@ -93,7 +93,6 @@ jobs: -DENABLE_CLDNN=OFF -DENABLE_PROFILING_ITT=OFF -DENABLE_SAMPLES=OFF - -DENABLE_SPEECH_DEMO=OFF -DNGRAPH_ONNX_FRONTEND_ENABLE=ON -DNGRAPH_DEBUG_ENABLE=OFF $(REPO_DIR) @@ -111,44 +110,44 @@ jobs: displayName: 'Install' - script: | - source $(INSTALL_DIR)/bin/setupvars.sh + source $(INSTALL_DIR)/setupvars.sh CXXFLAGS="-Wno-error=deprecated-declarations" ./build.sh --config RelWithDebInfo --use_openvino CPU_FP32 --build_shared_lib --parallel --skip_tests --build_dir $(ONNXRUNTIME_BUILD_DIR) workingDirectory: $(ONNXRUNTIME_REPO_DIR) displayName: 'Build Lin ONNX Runtime' - script: | - source $(INSTALL_DIR)/bin/setupvars.sh + source $(INSTALL_DIR)/setupvars.sh skip_tests=`tr -s '\n ' ':' < $(ONNXRUNTIME_UTILS)/skip_tests` ./onnxruntime_test_all --gtest_filter=-$skip_tests workingDirectory: $(ONNXRUNTIME_BUILD_DIR)/RelWithDebInfo displayName: 'Run onnxruntime_test_all' - script: | - source $(INSTALL_DIR)/bin/setupvars.sh + source $(INSTALL_DIR)/setupvars.sh ./onnxruntime_shared_lib_test workingDirectory: $(ONNXRUNTIME_BUILD_DIR)/RelWithDebInfo displayName: 'Run onnxruntime_shared_lib_test' - script: | - source $(INSTALL_DIR)/bin/setupvars.sh + source $(INSTALL_DIR)/setupvars.sh ./onnxruntime_global_thread_pools_test workingDirectory: $(ONNXRUNTIME_BUILD_DIR)/RelWithDebInfo displayName: 'Run onnxruntime_global_thread_pools_test' - script: | - source $(INSTALL_DIR)/bin/setupvars.sh + source $(INSTALL_DIR)/setupvars.sh ./onnxruntime_api_tests_without_env workingDirectory: $(ONNXRUNTIME_BUILD_DIR)/RelWithDebInfo displayName: 'Run onnxruntime_api_tests_without_env' - script: | - source $(INSTALL_DIR)/bin/setupvars.sh + source $(INSTALL_DIR)/setupvars.sh ./onnx_test_runner "$(ONNXRUNTIME_REPO_DIR)/cmake/external/onnx/onnx/backend/test/data/pytorch-converted" workingDirectory: $(ONNXRUNTIME_BUILD_DIR)/RelWithDebInfo displayName: 'Run pytorch-converted 
tests' - script: | - source $(INSTALL_DIR)/bin/setupvars.sh + source $(INSTALL_DIR)/setupvars.sh ./onnx_test_runner "$(ONNXRUNTIME_REPO_DIR)/cmake/external/onnx/onnx/backend/test/data/pytorch-operator" workingDirectory: $(ONNXRUNTIME_BUILD_DIR)/RelWithDebInfo displayName: 'Run pytorch-operator tests' diff --git a/.ci/azure/mac.yml b/.ci/azure/mac.yml index b07ff48f78ccc3..4534c08b0651d5 100644 --- a/.ci/azure/mac.yml +++ b/.ci/azure/mac.yml @@ -28,19 +28,19 @@ jobs: MODELS_PATH: $(REPO_DIR)/../testdata WORK_DIR: $(Pipeline.Workspace)/_w BUILD_DIR: $(WORK_DIR)/build - BIN_DIR: $(REPO_DIR)/bin/intel64/$(BUILD_TYPE) INSTALL_DIR: $(WORK_DIR)/install_pkg - SETUPVARS: $(INSTALL_DIR)/bin/setupvars.sh + INSTALL_TEST_DIR: $(INSTALL_DIR)/tests + SETUPVARS: $(INSTALL_DIR)/setupvars.sh steps: - script: | whoami uname -a - which python3 - python3 --version - which java - java -version - gcc --version + echo Python3 info ; which python3 ; python3 --version + echo Python info ; which python ; python --version + echo Java info ; which java ; java -version + echo gcc info ; which gcc ; gcc --version + echo cmake info ; which cmake ; cmake --version xcrun --sdk macosx --show-sdk-version env sysctl -a @@ -91,47 +91,64 @@ jobs: workingDirectory: $(BUILD_DIR) displayName: 'CMake' + - script: ls -alR $(REPO_DIR)/inference-engine/temp/ + displayName: 'List temp SDKs' + - script: ninja workingDirectory: $(BUILD_DIR) displayName: 'Build Mac' - script: ls -alR $(REPO_DIR)/bin/ - displayName: 'List files' + displayName: 'List bin files' - script: cmake -DCMAKE_INSTALL_PREFIX=$(INSTALL_DIR) -P cmake_install.cmake workingDirectory: $(BUILD_DIR) displayName: 'Install' - - script: $(BIN_DIR)/unit-test --gtest_print_time=1 --gtest_filter=-backend_api.config_unsupported:*IE_GPU*:IE_CPU.onnx_model_sigmoid:IE_CPU/GRUSequenceOp.onnx_model_gru* --gtest_output=xml:TEST-NGraphUT.xml - workingDirectory: $(BIN_DIR) + - script: ls -alR $(INSTALL_DIR) + displayName: 'List install files' + + - script: | + set -e + mkdir $(INSTALL_DIR)/opencv/ + cmake -DCMAKE_INSTALL_PREFIX=$(INSTALL_DIR) -DCOMPONENT=tests -P cmake_install.cmake + cp -R $(REPO_DIR)/inference-engine/temp/opencv_4.5.2_osx/opencv/* $(INSTALL_DIR)/opencv/ + workingDirectory: $(BUILD_DIR) + displayName: 'Install tests' + + - script: ls -alR $(INSTALL_DIR) + displayName: 'List install files' + + - script: . $(SETUPVARS) && $(INSTALL_TEST_DIR)/unit-test --gtest_print_time=1 --gtest_filter=-backend_api.config_unsupported:*IE_GPU*:IE_CPU.onnx_model_sigmoid:IE_CPU/GRUSequenceOp.onnx_model_gru* --gtest_output=xml:TEST-NGraphUT.xml + workingDirectory: $(INSTALL_TEST_DIR) displayName: 'nGraph UT' continueOnError: false - - script: $(BIN_DIR)/InferenceEngineUnitTests --gtest_print_time=1 --gtest_filter=-MKLDNNGraphStructureTests.TestNoRedundantReordersBeforeDWConvolution:TestConvolution/MKLDNNGraphConvolutionTests.TestsConvolution/0:TestConvolutionDefaultPrimitivesPriority/MKLDNNGraphConvolutionTests.TestsConvolution/0 --gtest_output=xml:TEST-InferenceEngineUnitTests.xml + - script: . 
$(SETUPVARS) && $(INSTALL_TEST_DIR)/InferenceEngineUnitTests --gtest_print_time=1 --gtest_filter=-MKLDNNGraphStructureTests.TestNoRedundantReordersBeforeDWConvolution:TestConvolution/MKLDNNGraphConvolutionTests.TestsConvolution/0:TestConvolutionDefaultPrimitivesPriority/MKLDNNGraphConvolutionTests.TestsConvolution/0 --gtest_output=xml:TEST-InferenceEngineUnitTests.xml displayName: 'IE UT old' continueOnError: false - - script: $(BIN_DIR)/ieUnitTests --gtest_output=xml:TEST-ieUnitTests.xml + - script: . $(SETUPVARS) && $(INSTALL_TEST_DIR)/ieUnitTests --gtest_output=xml:TEST-ieUnitTests.xml displayName: 'IE UT' continueOnError: false - - script: $(BIN_DIR)/cpuUnitTests --gtest_output=xml:TEST-cpuUnitTests.xml + - script: . $(SETUPVARS) && $(INSTALL_TEST_DIR)/cpuUnitTests --gtest_output=xml:TEST-cpuUnitTests.xml displayName: 'CPU UT' continueOnError: false - - script: $(BIN_DIR)/vpuUnitTests --gtest_output=xml:TEST-vpuUnitTests.xml + - script: . $(SETUPVARS) && $(INSTALL_TEST_DIR)/vpuUnitTests --gtest_output=xml:TEST-vpuUnitTests.xml displayName: 'VPU UT' continueOnError: false - - script: $(BIN_DIR)/onnxImporterUnitTests --gtest_output=xml:TEST-onnxImporterUnitTests.xml + - script: . $(SETUPVARS) && $(INSTALL_TEST_DIR)/onnxImporterUnitTests --gtest_output=xml:TEST-onnxImporterUnitTests.xml displayName: 'ONNX Importer UT' continueOnError: false - - script: $(BIN_DIR)/ieFuncTests --gtest_output=xml:TEST-ieFuncTests.xml + - script: . $(SETUPVARS) && $(INSTALL_TEST_DIR)/ieFuncTests --gtest_output=xml:TEST-ieFuncTests.xml displayName: 'IE FuncTests' continueOnError: false - - script: $(BIN_DIR)/cpuFuncTests --gtest_filter=*smoke*:-smoke_LPT/ReduceMinTransformation.CompareWithRefImpl/f32_Shape* --gtest_print_time=1 --gtest_output=xml:TEST-cpuFuncTests.xml + - script: . $(SETUPVARS) && $(INSTALL_TEST_DIR)/cpuFuncTests --gtest_filter=*smoke*:-smoke_LPT/ReduceMinTransformation.CompareWithRefImpl/f32_Shape* --gtest_print_time=1 --gtest_output=xml:TEST-cpuFuncTests.xml displayName: 'CPU FuncTests' continueOnError: false enabled: false @@ -139,7 +156,7 @@ jobs: - script: | export DATA_PATH=$(MODELS_PATH) export MODELS_PATH=$(MODELS_PATH) - $(BIN_DIR)/InferenceEngineCAPITests --gtest_output=xml:TEST-InferenceEngineCAPITests.xml + . 
$(SETUPVARS) && $(INSTALL_TEST_DIR)/InferenceEngineCAPITests --gtest_output=xml:TEST-InferenceEngineCAPITests.xml displayName: 'IE CAPITests' continueOnError: false diff --git a/.ci/azure/windows.yml b/.ci/azure/windows.yml index 3d0936c5411eeb..81c1ba956017d8 100644 --- a/.ci/azure/windows.yml +++ b/.ci/azure/windows.yml @@ -33,7 +33,7 @@ jobs: MSVC_COMPILER_PATH: C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\VC\Tools\MSVC\14.24.28314\bin\Hostx64\x64\cl.exe INSTALL_DIR: $(WORK_DIR)\install_pkg INSTALL_TEST_DIR: $(INSTALL_DIR)\tests - SETUPVARS: $(INSTALL_DIR)\bin\setupvars.bat + SETUPVARS: $(INSTALL_DIR)\setupvars.bat steps: - script: | @@ -122,11 +122,11 @@ jobs: - script: dir $(INSTALL_DIR) /s displayName: 'List install files' - - script: $(INSTALL_DIR)\deployment_tools\inference_engine\samples\cpp\build_samples_msvc.bat + - script: $(INSTALL_DIR)\samples\cpp\build_samples_msvc.bat workingDirectory: $(BUILD_SAMPLES_DIR) displayName: 'Build cpp samples' - - script: $(INSTALL_DIR)\deployment_tools\inference_engine\samples\c\build_samples_msvc.bat + - script: $(INSTALL_DIR)\samples\c\build_samples_msvc.bat workingDirectory: $(BUILD_SAMPLES_DIR) displayName: 'Build c samples' diff --git a/.ci/azure/windows_conditional_compilation.yml b/.ci/azure/windows_conditional_compilation.yml index 9024ede46f6018..80c89e8d20f28e 100644 --- a/.ci/azure/windows_conditional_compilation.yml +++ b/.ci/azure/windows_conditional_compilation.yml @@ -19,7 +19,7 @@ jobs: MSVS_VARS_PATH: C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\VC\Auxiliary\Build\vcvars64.bat MSVC_COMPILER_PATH: C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\VC\Tools\MSVC\14.24.28314\bin\Hostx64\x64\cl.exe INSTALL_DIR: $(WORK_DIR)\install_pkg - SETUPVARS: $(INSTALL_DIR)\bin\setupvars.bat + SETUPVARS: $(INSTALL_DIR)\setupvars.bat steps: - script: | diff --git a/.ci/openvino-onnx/Dockerfile b/.ci/openvino-onnx/Dockerfile index 314ab2c103746d..8e2365e4ebc506 100644 --- a/.ci/openvino-onnx/Dockerfile +++ b/.ci/openvino-onnx/Dockerfile @@ -65,7 +65,6 @@ RUN cmake .. \ -DENABLE_CLDNN=OFF \ -DENABLE_PROFILING_ITT=OFF \ -DENABLE_SAMPLES=OFF \ - -DENABLE_SPEECH_DEMO=OFF \ -DENABLE_PYTHON=ON \ -DPYTHON_EXECUTABLE=/usr/bin/python3 \ -DNGRAPH_ONNX_FRONTEND_ENABLE=ON \ @@ -75,8 +74,8 @@ RUN cmake .. 
\ RUN make -j $(nproc) install # Run tests via tox -WORKDIR /openvino/ngraph/python -ENV ngraph_DIR=/openvino/dist/deployment_tools/ngraph -ENV LD_LIBRARY_PATH=/openvino/dist/deployment_tools/ngraph/lib +WORKDIR /openvino/runtime/bindings/python +ENV OpenVINO_DIR=/openvino/dist/runtime/cmake +ENV LD_LIBRARY_PATH=/openvino/dist/runtime/lib:/openvino/dist/runtime/3rdparty/tbb/lib ENV PYTHONPATH=/openvino/bin/intel64/${BUILD_TYPE}/lib/python_api/python3.8:${PYTHONPATH} CMD tox diff --git a/.ci/openvino-onnx/Jenkinsfile b/.ci/openvino-onnx/Jenkinsfile index 2849579dcdbf6b..5581c7c2ea8ad0 100644 --- a/.ci/openvino-onnx/Jenkinsfile +++ b/.ci/openvino-onnx/Jenkinsfile @@ -94,7 +94,7 @@ def prepare_repository(String workdir) { def updateModels() { sh """ - ./ngraph/python/tests/test_onnx/model_zoo_preprocess.sh -d ${HOME}/ONNX_CI/models_data -o -s ${ONNX_MODEL_ZOO_SHA} + ./runtime/bindings/python/tests/test_onnx/model_zoo_preprocess.sh -d ${HOME}/ONNX_CI/models_data -o -s ${ONNX_MODEL_ZOO_SHA} """ } diff --git a/.github/dependabot.yml b/.github/dependabot.yml index 7d450a951830a0..cc8124c21c7b54 100644 --- a/.github/dependabot.yml +++ b/.github/dependabot.yml @@ -4,7 +4,7 @@ version: 2 updates: # Enable version updates for nGraph Python API - package-ecosystem: pip - directory: "/ngraph/python" + directory: "/runtime/bindings/python" schedule: interval: weekly day: monday diff --git a/.github/workflows/build_doc.yml b/.github/workflows/build_doc.yml index 40e02fd59b31bd..92b88967845b19 100644 --- a/.github/workflows/build_doc.yml +++ b/.github/workflows/build_doc.yml @@ -14,6 +14,7 @@ jobs: - name: Install dependencies run: | + sudo apt update sudo apt --assume-yes install libusb-1.0-0-dev graphviz texlive python3 -m pip install lxml # install doxygen diff --git a/.github/workflows/code_style.yml b/.github/workflows/code_style.yml index 8f30c986361f45..3eecdc0aff5131 100644 --- a/.github/workflows/code_style.yml +++ b/.github/workflows/code_style.yml @@ -10,10 +10,13 @@ jobs: submodules: recursive - name: Install clang-format-9 - run: sudo apt --assume-yes install clang-format-9 + run: | + sudo apt update + sudo apt --assume-yes install clang-format-9 - name: Install dependencies run: | + sudo apt update sudo apt --assume-yes install libusb-1.0-0-dev python3 -m pip install --upgrade pip python3 -m pip install -r ./inference-engine/ie_bridges/python/requirements.txt @@ -52,7 +55,9 @@ jobs: submodules: recursive - name: Install ShellCheck - run: sudo apt --assume-yes install shellcheck + run: | + sudo apt update + sudo apt --assume-yes install shellcheck - name: Install dependencies run: python3 -m pip install -r ./inference-engine/ie_bridges/python/requirements.txt @@ -75,7 +80,9 @@ jobs: submodules: recursive - name: Install Clang dependency - run: sudo apt --assume-yes install libclang-9-dev + run: | + sudo apt update + sudo apt --assume-yes install libclang-9-dev - name: Install Python-based dependencies run: python3 -m pip install -r cmake/developer_package/ncc_naming_style/requirements_dev.txt diff --git a/.github/workflows/mo.yml b/.github/workflows/mo.yml index ebc0827adb0622..00fcec9d0258d6 100644 --- a/.github/workflows/mo.yml +++ b/.github/workflows/mo.yml @@ -41,6 +41,7 @@ jobs: pip install -r requirements.txt pip install -r requirements_dev.txt # requrements for CMake + sudo apt update sudo apt --assume-yes install libusb-1.0-0-dev working-directory: model-optimizer diff --git a/.gitmodules b/.gitmodules index 095f39682640b6..8569ecbb9587ea 100644 --- a/.gitmodules +++ b/.gitmodules @@ 
-44,8 +44,8 @@ [submodule "thirdparty/protobuf"] path = thirdparty/protobuf/protobuf url = https://github.com/protocolbuffers/protobuf.git -[submodule "ngraph/python/pybind11"] - path = ngraph/python/pybind11 +[submodule "runtime/bindings/python/thirdparty/pybind11"] + path = runtime/bindings/python/thirdparty/pybind11 url = https://github.com/pybind/pybind11.git [submodule "thirdparty/ittapi/ittapi"] path = thirdparty/ittapi/ittapi diff --git a/CMakeLists.txt b/CMakeLists.txt index 61a96ae9f4c816..7ead5a53212142 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -26,13 +26,15 @@ endif() # resolving dependencies for the project message (STATUS "PROJECT ............................... " ${PROJECT_NAME}) message (STATUS "CMAKE_BINARY_DIR ...................... " ${CMAKE_BINARY_DIR}) -message (STATUS "OpenVINO_SOURCE_DIR .... .......... " ${OpenVINO_SOURCE_DIR}) +message (STATUS "OpenVINO_SOURCE_DIR ................... " ${OpenVINO_SOURCE_DIR}) message (STATUS "CMAKE_GENERATOR ....................... " ${CMAKE_GENERATOR}) message (STATUS "CMAKE_C_COMPILER_ID ................... " ${CMAKE_C_COMPILER_ID}) message (STATUS "CMAKE_BUILD_TYPE ...................... " ${CMAKE_BUILD_TYPE}) # remove file with exported developer targets to force its regeneration +file(REMOVE "${CMAKE_BINARY_DIR}/ngraph/ngraphTargets.cmake") file(REMOVE "${CMAKE_BINARY_DIR}/InferenceEngineTargets.cmake") +file(REMOVE "${CMAKE_BINARY_DIR}/OpenVINOTargets.cmake") foreach(component IN LISTS openvino_export_components) file(REMOVE "${CMAKE_BINARY_DIR}/${component}_dev_targets.cmake") unset(${component} CACHE) @@ -83,6 +85,7 @@ include(cmake/test_model_zoo.cmake) add_subdirectory(thirdparty) add_subdirectory(openvino) add_subdirectory(ngraph) +add_subdirectory(runtime) add_subdirectory(inference-engine) # for Template plugin diff --git a/CODEOWNERS b/CODEOWNERS index 165bc7455631f2..bc7beb0841ef38 100644 --- a/CODEOWNERS +++ b/CODEOWNERS @@ -44,7 +44,6 @@ azure-pipelines.yml @openvinotoolkit/openvino-admins /inference-engine/tests/functional/plugin/myriad/ @openvinotoolkit/openvino-ie-vpu-maintainers @openvinotoolkit/openvino-ie-tests-maintainers /inference-engine/tests/unit/vpu/ @openvinotoolkit/openvino-ie-vpu-maintainers @openvinotoolkit/openvino-ie-tests-maintainers /inference-engine/tests/unit/engines/vpu/ @openvinotoolkit/openvino-ie-vpu-maintainers @openvinotoolkit/openvino-ie-tests-maintainers -/inference-engine/tools/vpu/ @openvinotoolkit/openvino-ie-vpu-maintainers /inference-engine/scripts/run_tests_myriad_multistick.sh @openvinotoolkit/openvino-ie-vpu-maintainers # IE GNA: @@ -72,6 +71,7 @@ azure-pipelines.yml @openvinotoolkit/openvino-admins # Documentation /docs/ @openvinotoolkit/openvino-docs-maintainers +/docs/template_plugin/ @openvinotoolkit/openvino-ie-template-maintainers *.md @openvinotoolkit/openvino-docs-maintainers # Control 3d party dependencies diff --git a/README.md b/README.md index c445e5209b11cc..7c4b3cdd3a707c 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,5 @@ # OpenVINO™ Toolkit -[![Stable release](https://img.shields.io/badge/version-2021.4-green.svg)](https://github.com/openvinotoolkit/openvino/releases/tag/2021.4) +[![Stable release](https://img.shields.io/badge/version-2021.4.1-green.svg)](https://github.com/openvinotoolkit/openvino/releases/tag/2021.4.1) [![Apache License Version 2.0](https://img.shields.io/badge/license-Apache_2.0-green.svg)](LICENSE) ![GitHub branch checks state](https://img.shields.io/github/checks-status/openvinotoolkit/openvino/master?label=GitHub%20checks) 
![Azure DevOps builds (branch)](https://img.shields.io/azure-devops/build/openvinoci/b2bab62f-ab2f-4871-a538-86ea1be7d20f/13?label=Public%20CI) diff --git a/cmake/dependencies.cmake b/cmake/dependencies.cmake index 82f98b4c515ff3..b4946d85d11d85 100644 --- a/cmake/dependencies.cmake +++ b/cmake/dependencies.cmake @@ -89,7 +89,7 @@ if(THREADING STREQUAL "OMP") ie_cpack_add_component(omp REQUIRED) file(GLOB_RECURSE source_list "${OMP}/*${CMAKE_SHARED_LIBRARY_SUFFIX}*") install(FILES ${source_list} - DESTINATION "deployment_tools/inference_engine/external/omp/lib" + DESTINATION "runtime/3rdparty/omp/lib" COMPONENT omp) endif() @@ -298,44 +298,3 @@ if(ENABLE_GNA) update_deps_cache(GNA "${GNA}" "Path to GNA root folder") debug_message(STATUS "gna=" ${GNA}) endif() - -if(ENABLE_SPEECH_DEMO) - reset_deps_cache(SPEECH_LIBS_AND_DEMOS) - if(DEFINED ENV{THIRDPARTY_SERVER_PATH}) - set(IE_PATH_TO_DEPS "$ENV{THIRDPARTY_SERVER_PATH}") - elseif(DEFINED THIRDPARTY_SERVER_PATH) - set(IE_PATH_TO_DEPS "${THIRDPARTY_SERVER_PATH}") - else() - message(WARNING "Unable to locate Speech Demo") - endif() - if(DEFINED IE_PATH_TO_DEPS) - if(WIN32 AND X86_64) - RESOLVE_DEPENDENCY(SPEECH_LIBS_AND_DEMOS - ARCHIVE_WIN "speech_demo_1.0.0.780_windows.zip" - VERSION_REGEX ".*_([0-9]+.[0-9]+.[0-9]+.[0-9]+).*" - TARGET_PATH "${TEMP}/speech_demo_1.0.0.780" - SHA256 "957bd274a1f6dc1d83a46879c7ef3b3b06f17d11af85cc45c18919051d145abd") - debug_message(STATUS "speech_libs_and_demos=" ${SPEECH_LIBS_AND_DEMOS}) - elseif(LINUX AND X86_64) - if(LINUX_OS_NAME STREQUAL "CentOS 7" OR CMAKE_CXX_COMPILER_VERSION VERSION_LESS "4.9") - RESOLVE_DEPENDENCY(SPEECH_LIBS_AND_DEMOS - ARCHIVE_LIN "speech_demo_1.0.0.780_centos.tgz" - VERSION_REGEX ".*_([0-9]+.[0-9]+.[0-9]+.[0-9]+).*" - TARGET_PATH "${TEMP}/speech_demo_1.0.0.780" - SHA256 "6d8d1111d0e662fe71d71cd3debad2995f6fb6fe5df3b92196dae06ff7abdf44") - debug_message(STATUS "speech_libs_and_demos=" ${SPEECH_LIBS_AND_DEMOS}) - else() - RESOLVE_DEPENDENCY(SPEECH_LIBS_AND_DEMOS - ARCHIVE_LIN "speech_demo_1.0.0.780_linux.tgz" - VERSION_REGEX ".*_([0-9]+.[0-9]+.[0-9]+.[0-9]+).*" - TARGET_PATH "${TEMP}/speech_demo_1.0.0.780" - SHA256 "0ec6f1e47c00d781dc918af5d3055ab474ff47b9978dd6fe2add73e3339b0763") - debug_message(STATUS "speech_libs_and_demos=" ${SPEECH_LIBS_AND_DEMOS}) - endif() - else() - message(FATAL_ERROR "Speech Demo is not available on current platform") - endif() - unset(IE_PATH_TO_DEPS) - endif() - update_deps_cache(SPEECH_LIBS_AND_DEMOS "${SPEECH_LIBS_AND_DEMOS}" "Path to SPEECH_LIBS_AND_DEMOS root folder") -endif() diff --git a/cmake/developer_package/packaging.cmake b/cmake/developer_package/packaging.cmake index 4095a16157c068..7708de5c77b921 100644 --- a/cmake/developer_package/packaging.cmake +++ b/cmake/developer_package/packaging.cmake @@ -10,16 +10,15 @@ include(CPackComponent) # # Set library directory for cpack # -set(IE_CPACK_IE_DIR deployment_tools/inference_engine) function(ie_cpack_set_library_dir) if(WIN32) - set(IE_CPACK_LIBRARY_PATH ${IE_CPACK_IE_DIR}/lib/${ARCH_FOLDER}/$ PARENT_SCOPE) - set(IE_CPACK_RUNTIME_PATH ${IE_CPACK_IE_DIR}/bin/${ARCH_FOLDER}/$ PARENT_SCOPE) - set(IE_CPACK_ARCHIVE_PATH ${IE_CPACK_IE_DIR}/lib/${ARCH_FOLDER}/$ PARENT_SCOPE) + set(IE_CPACK_LIBRARY_PATH runtime/lib/${ARCH_FOLDER}/$ PARENT_SCOPE) + set(IE_CPACK_RUNTIME_PATH runtime/bin/${ARCH_FOLDER}/$ PARENT_SCOPE) + set(IE_CPACK_ARCHIVE_PATH runtime/lib/${ARCH_FOLDER}/$ PARENT_SCOPE) else() - set(IE_CPACK_LIBRARY_PATH ${IE_CPACK_IE_DIR}/lib/${ARCH_FOLDER} PARENT_SCOPE) - set(IE_CPACK_RUNTIME_PATH 
${IE_CPACK_IE_DIR}/lib/${ARCH_FOLDER} PARENT_SCOPE) - set(IE_CPACK_ARCHIVE_PATH ${IE_CPACK_IE_DIR}/lib/${ARCH_FOLDER} PARENT_SCOPE) + set(IE_CPACK_LIBRARY_PATH runtime/lib/${ARCH_FOLDER} PARENT_SCOPE) + set(IE_CPACK_RUNTIME_PATH runtime/lib/${ARCH_FOLDER} PARENT_SCOPE) + set(IE_CPACK_ARCHIVE_PATH runtime/lib/${ARCH_FOLDER} PARENT_SCOPE) endif() endfunction() diff --git a/cmake/developer_package/plugins/create_plugin_file.cmake b/cmake/developer_package/plugins/create_plugin_file.cmake index 88f33904bee30a..cb28967d7960b2 100644 --- a/cmake/developer_package/plugins/create_plugin_file.cmake +++ b/cmake/developer_package/plugins/create_plugin_file.cmake @@ -2,6 +2,8 @@ # SPDX-License-Identifier: Apache-2.0 # +cmake_policy(SET CMP0007 NEW) + set(newContent " ") if(IE_PLUGIN_PROPERTIES) @@ -9,10 +11,11 @@ if(IE_PLUGIN_PROPERTIES) ") foreach(props IN LISTS IE_PLUGIN_PROPERTIES) - string(REPLACE "," ";" props "${props}") + string(REPLACE ":" ";" props "${props}") list(GET props 0 key) list(GET props 1 value) + set(newContent "${newContent} ") endforeach() diff --git a/cmake/developer_package/plugins/plugins.cmake b/cmake/developer_package/plugins/plugins.cmake index cec023f3062513..3f83954cfa7f8c 100644 --- a/cmake/developer_package/plugins/plugins.cmake +++ b/cmake/developer_package/plugins/plugins.cmake @@ -20,19 +20,18 @@ endif() # # ie_add_plugin(NAME # DEVICE_NAME -# SOURCES -# OBJECT_LIBRARIES -# VERSION_DEFINES_FOR -# SKIP_INSTALL +# [PSEUDO] +# [DEFAULT_CONFIG ] +# [SOURCES ] +# [OBJECT_LIBRARIES ] +# [VERSION_DEFINES_FOR ] +# [SKIP_INSTALL] # ) # function(ie_add_plugin) - set(options - SKIP_INSTALL - ADD_CLANG_FORMAT - ) + set(options SKIP_INSTALL ADD_CLANG_FORMAT PSEUDO_PLUGIN) set(oneValueArgs NAME DEVICE_NAME VERSION_DEFINES_FOR) - set(multiValueArgs SOURCES OBJECT_LIBRARIES CPPLINT_FILTERS) + set(multiValueArgs DEFAULT_CONFIG SOURCES OBJECT_LIBRARIES CPPLINT_FILTERS) cmake_parse_arguments(IE_PLUGIN "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN}) if(NOT IE_PLUGIN_NAME) @@ -45,41 +44,73 @@ function(ie_add_plugin) # create and configure target - if(IE_PLUGIN_VERSION_DEFINES_FOR) - addVersionDefines(${IE_PLUGIN_VERSION_DEFINES_FOR} CI_BUILD_NUMBER) - endif() + if(NOT IE_PLUGIN_PSEUDO_PLUGIN) + if(IE_PLUGIN_VERSION_DEFINES_FOR) + addVersionDefines(${IE_PLUGIN_VERSION_DEFINES_FOR} CI_BUILD_NUMBER) + endif() - set(input_files ${IE_PLUGIN_SOURCES}) - foreach(obj_lib IN LISTS IE_PLUGIN_OBJECT_LIBRARIES) - list(APPEND input_files $) - add_cpplint_target(${obj_lib}_cpplint FOR_TARGETS ${obj_lib}) - endforeach() + set(input_files ${IE_PLUGIN_SOURCES}) + foreach(obj_lib IN LISTS IE_PLUGIN_OBJECT_LIBRARIES) + list(APPEND input_files $) + add_cpplint_target(${obj_lib}_cpplint FOR_TARGETS ${obj_lib}) + endforeach() - add_library(${IE_PLUGIN_NAME} MODULE ${input_files}) - target_compile_definitions(${IE_PLUGIN_NAME} PRIVATE IMPLEMENT_INFERENCE_ENGINE_PLUGIN) + add_library(${IE_PLUGIN_NAME} MODULE ${input_files}) + target_compile_definitions(${IE_PLUGIN_NAME} PRIVATE IMPLEMENT_INFERENCE_ENGINE_PLUGIN) - ie_add_vs_version_file(NAME ${IE_PLUGIN_NAME} - FILEDESCRIPTION "Inference Engine ${IE_PLUGIN_DEVICE_NAME} device plugin library") + ie_add_vs_version_file(NAME ${IE_PLUGIN_NAME} + FILEDESCRIPTION "Inference Engine ${IE_PLUGIN_DEVICE_NAME} device plugin library") - if(TARGET IE::inference_engine_plugin_api) - target_link_libraries(${IE_PLUGIN_NAME} PRIVATE IE::inference_engine_plugin_api) - else() - target_link_libraries(${IE_PLUGIN_NAME} PRIVATE inference_engine_plugin_api) - endif() + 
if(TARGET IE::inference_engine_plugin_api) + target_link_libraries(${IE_PLUGIN_NAME} PRIVATE IE::inference_engine_plugin_api) + else() + target_link_libraries(${IE_PLUGIN_NAME} PRIVATE inference_engine_plugin_api) + endif() - if(WIN32) - set_target_properties(${IE_PLUGIN_NAME} PROPERTIES COMPILE_PDB_NAME ${IE_PLUGIN_NAME}) - endif() + if(WIN32) + set_target_properties(${IE_PLUGIN_NAME} PROPERTIES COMPILE_PDB_NAME ${IE_PLUGIN_NAME}) + endif() - set(custom_filter "") - foreach(filter IN LISTS IE_PLUGIN_CPPLINT_FILTERS) - string(CONCAT custom_filter "${custom_filter}" "," "${filter}") - endforeach() + set(custom_filter "") + foreach(filter IN LISTS IE_PLUGIN_CPPLINT_FILTERS) + string(CONCAT custom_filter "${custom_filter}" "," "${filter}") + endforeach() - if (IE_PLUGIN_ADD_CLANG_FORMAT) - add_clang_format_target(${IE_PLUGIN_NAME}_clang FOR_TARGETS ${IE_PLUGIN_NAME}) - else() - add_cpplint_target(${IE_PLUGIN_NAME}_cpplint FOR_TARGETS ${IE_PLUGIN_NAME} CUSTOM_FILTERS ${custom_filter}) + if (IE_PLUGIN_ADD_CLANG_FORMAT) + add_clang_format_target(${IE_PLUGIN_NAME}_clang FOR_TARGETS ${IE_PLUGIN_NAME}) + else() + add_cpplint_target(${IE_PLUGIN_NAME}_cpplint FOR_TARGETS ${IE_PLUGIN_NAME} CUSTOM_FILTERS ${custom_filter}) + endif() + + add_dependencies(ie_plugins ${IE_PLUGIN_NAME}) + if(TARGET inference_engine_preproc) + add_dependencies(${IE_PLUGIN_NAME} inference_engine_preproc) + endif() + + # fake dependencies to build in the following order: + # IE -> IE readers -> IE inference plugins -> IE-based apps + if(TARGET inference_engine_ir_reader) + add_dependencies(${IE_PLUGIN_NAME} inference_engine_ir_reader) + endif() + if(TARGET inference_engine_ir_v7_reader) + add_dependencies(${IE_PLUGIN_NAME} inference_engine_ir_v7_reader) + endif() + if(TARGET onnx_ngraph_frontend) + add_dependencies(${IE_PLUGIN_NAME} onnx_ngraph_frontend) + endif() + if(TARGET paddlepaddle_ngraph_frontend) + add_dependencies(${IE_PLUGIN_NAME} paddlepaddle_ngraph_frontend) + endif() + + # install rules + if(NOT IE_PLUGIN_SKIP_INSTALL) + string(TOLOWER "${IE_PLUGIN_DEVICE_NAME}" install_component) + ie_cpack_add_component(${install_component} REQUIRED DEPENDS core) + + install(TARGETS ${IE_PLUGIN_NAME} + LIBRARY DESTINATION ${IE_CPACK_RUNTIME_PATH} + COMPONENT ${install_component}) + endif() endif() # check that plugin with such name is not registered @@ -98,33 +129,7 @@ function(ie_add_plugin) list(APPEND PLUGIN_FILES "${IE_PLUGIN_DEVICE_NAME}:${IE_PLUGIN_NAME}") set(PLUGIN_FILES "${PLUGIN_FILES}" CACHE INTERNAL "" FORCE) - - add_dependencies(ie_plugins ${IE_PLUGIN_NAME}) - if(TARGET inference_engine_preproc) - add_dependencies(${IE_PLUGIN_NAME} inference_engine_preproc) - endif() - - # fake dependencies to build in the following order: - # IE -> IE readers -> IE inference plugins -> IE-based apps - if(TARGET inference_engine_ir_reader) - add_dependencies(${IE_PLUGIN_NAME} inference_engine_ir_reader) - endif() - if(TARGET inference_engine_ir_v7_reader) - add_dependencies(${IE_PLUGIN_NAME} inference_engine_ir_v7_reader) - endif() - if(TARGET onnx_ngraph_frontend) - add_dependencies(${IE_PLUGIN_NAME} onnx_ngraph_frontend) - endif() - - # install rules - - if(NOT IE_PLUGIN_SKIP_INSTALL) - string(TOLOWER "${IE_PLUGIN_DEVICE_NAME}" install_component) - ie_cpack_add_component(${install_component} REQUIRED DEPENDS core) - - install(TARGETS ${IE_PLUGIN_NAME} - LIBRARY DESTINATION ${IE_CPACK_RUNTIME_PATH} COMPONENT ${install_component}) - endif() + set(${IE_PLUGIN_DEVICE_NAME}_CONFIG "${IE_PLUGIN_DEFAULT_CONFIG}" CACHE INTERNAL "" 
FORCE) endfunction() # @@ -168,7 +173,7 @@ macro(ie_register_plugins) list(GET name 1 name) # create plugin file - set(config_file_name "${CMAKE_BINARY_DIR}/plugins/${name}.xml") + set(config_file_name "${CMAKE_BINARY_DIR}/plugins/${device_name}.xml") ie_plugin_get_file_name(${name} library_name) add_custom_command(TARGET ${IE_REGISTER_MAIN_TARGET} POST_BUILD @@ -176,9 +181,10 @@ macro(ie_register_plugins) "${CMAKE_COMMAND}" -D "IE_CONFIG_OUTPUT_FILE=${config_file_name}" -D "IE_DEVICE_NAME=${device_name}" + -D "IE_PLUGIN_PROPERTIES=${${device_name}_CONFIG}" -D "IE_PLUGIN_LIBRARY_NAME=${library_name}" -P "${IEDevScripts_DIR}/plugins/create_plugin_file.cmake" - COMMENT "Register ${name} plugin" + COMMENT "Register ${device_name} device as ${library_name}" VERBATIM) list(APPEND plugin_files_local "${config_file_name}") diff --git a/cmake/features.cmake b/cmake/features.cmake index cf9fbebbe9410a..450b0d255ccc05 100644 --- a/cmake/features.cmake +++ b/cmake/features.cmake @@ -98,8 +98,6 @@ ie_dependent_option (ENABLE_FUNCTIONAL_TESTS "functional tests" ON "ENABLE_TESTS ie_dependent_option (ENABLE_SAMPLES "console samples are part of inference engine package" ON "NOT MINGW" OFF) -ie_dependent_option (ENABLE_SPEECH_DEMO "enable speech demo integration" ON "NOT APPLE;NOT ANDROID;X86_64" OFF) - ie_option (ENABLE_OPENCV "enables OpenCV" ON) ie_option (ENABLE_V7_SERIALIZE "enables serialization to IR v7" OFF) diff --git a/cmake/templates/InferenceEngineConfig.cmake.in b/cmake/templates/InferenceEngineConfig.cmake.in index 43408483f9af6e..c6a69a907f2874 100644 --- a/cmake/templates/InferenceEngineConfig.cmake.in +++ b/cmake/templates/InferenceEngineConfig.cmake.in @@ -25,92 +25,32 @@ @PACKAGE_INIT@ -# -# Common functions -# - if(NOT DEFINED CMAKE_FIND_PACKAGE_NAME) set(CMAKE_FIND_PACKAGE_NAME InferenceEngine) - set(_need_package_name_reset ON) + set(_ie_need_package_name_reset ON) endif() -# we have to use our own version of find_dependency because of support cmake 3.7 -macro(_ie_find_dependency dep) - set(cmake_fd_quiet_arg) - if(${CMAKE_FIND_PACKAGE_NAME}_FIND_QUIETLY) - set(cmake_fd_quiet_arg QUIET) - endif() - set(cmake_fd_required_arg) - if(${CMAKE_FIND_PACKAGE_NAME}_FIND_REQUIRED) - set(cmake_fd_required_arg REQUIRED) - endif() - - get_property(cmake_fd_alreadyTransitive GLOBAL PROPERTY - _CMAKE_${dep}_TRANSITIVE_DEPENDENCY) - - find_package(${dep} ${ARGN} - ${cmake_fd_quiet_arg} - ${cmake_fd_required_arg}) - - if(NOT DEFINED cmake_fd_alreadyTransitive OR cmake_fd_alreadyTransitive) - set_property(GLOBAL PROPERTY _CMAKE_${dep}_TRANSITIVE_DEPENDENCY TRUE) - endif() - - if(NOT ${dep}_FOUND) - set(${CMAKE_FIND_PACKAGE_NAME}_NOT_FOUND_MESSAGE "${CMAKE_FIND_PACKAGE_NAME} could not be found because dependency ${dep} could not be found.") - set(${CMAKE_FIND_PACKAGE_NAME}_FOUND False) - return() - endif() - - set(cmake_fd_required_arg) - set(cmake_fd_quiet_arg) -endmacro() - -function(_ie_target_no_deprecation_error) - if(NOT MSVC) - if(CMAKE_CXX_COMPILER_ID STREQUAL "Intel") - set(flags "-diag-warning=1786") - else() - set(flags "-Wno-error=deprecated-declarations") - endif() - if(CMAKE_CROSSCOMPILING) - set_target_properties(${ARGV} PROPERTIES - INTERFACE_LINK_OPTIONS "-Wl,--allow-shlib-undefined") - endif() - - set_target_properties(${ARGV} PROPERTIES INTERFACE_COMPILE_OPTIONS ${flags}) - endif() -endfunction() +# need to store current PACKAGE_PREFIX_DIR, because it's overwritten by sub-package one +set(_ie_package_prefix_dir "${PACKAGE_PREFIX_DIR}") -# -# Inference Engine config -# 
+include(CMakeFindDependencyMacro) -# need to store current PACKAGE_PREFIX_DIR, because it's overwritten by ngraph one -set(IE_PACKAGE_PREFIX_DIR "${PACKAGE_PREFIX_DIR}") +find_dependency(OpenVINO + PATHS "${CMAKE_CURRENT_LIST_DIR}" + NO_CMAKE_FIND_ROOT_PATH + NO_DEFAULT_PATH) -set(THREADING "@THREADING@") -if(THREADING STREQUAL "TBB" OR THREADING STREQUAL "TBB_AUTO" AND NOT TBB_FOUND) - set_and_check(_tbb_dir "@PACKAGE_IE_TBB_DIR@") - _ie_find_dependency(TBB - COMPONENTS tbb tbbmalloc - CONFIG - PATHS ${TBBROOT}/cmake - ${_tbb_dir} - NO_CMAKE_FIND_ROOT_PATH - NO_DEFAULT_PATH) +# create targets with old names for compatibility +if(TARGET openvino::runtime AND NOT TARGET IE::inference_engine) + add_library(IE::inference_engine INTERFACE IMPORTED) + set_target_properties(IE::inference_engine PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::runtime) endif() -set_and_check(_ngraph_dir "@PACKAGE_IE_NGRAPH_DIR@") -_ie_find_dependency(ngraph - CONFIG - PATHS ${_ngraph_dir} - NO_CMAKE_FIND_ROOT_PATH - NO_DEFAULT_PATH) - -if(NOT TARGET inference_engine) - set(_ie_as_external_package ON) - include("${CMAKE_CURRENT_LIST_DIR}/InferenceEngineTargets.cmake") +if(TARGET openvino::runtime::c AND NOT TARGET IE::inference_engine_c_api) + add_library(IE::inference_engine_c_api INTERFACE IMPORTED) + set_target_properties(IE::inference_engine_c_api PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::runtime::c) endif() # mark components as available @@ -126,29 +66,21 @@ unset(InferenceEngine_LIBRARIES) foreach(comp IN LISTS ${CMAKE_FIND_PACKAGE_NAME}_FIND_COMPONENTS) # check if the component is available if(${CMAKE_FIND_PACKAGE_NAME}_${comp}_FOUND) - set(pcomp ${comp}) - if(_ie_as_external_package) - set(pcomp IE::${comp}) - endif() + set(pcomp IE::${comp}) list(APPEND InferenceEngine_LIBRARIES ${pcomp}) endif() endforeach() -if(_ie_as_external_package) - _ie_target_no_deprecation_error(${InferenceEngine_LIBRARIES}) -endif() -unset(_ie_as_external_package) - # restore PACKAGE_PREFIX_DIR -set(PACKAGE_PREFIX_DIR ${IE_PACKAGE_PREFIX_DIR}) -unset(IE_PACKAGE_PREFIX_DIR) +set(PACKAGE_PREFIX_DIR ${_ie_package_prefix_dir}) +unset(_ie_package_prefix_dir) set_and_check(InferenceEngine_INCLUDE_DIRS "@PACKAGE_IE_INCLUDE_DIR@") check_required_components(${CMAKE_FIND_PACKAGE_NAME}) -if(_need_package_name_reset) +if(_ie_need_package_name_reset) unset(CMAKE_FIND_PACKAGE_NAME) - unset(_need_package_name_reset) + unset(_ie_need_package_name_reset) endif() diff --git a/cmake/templates/InferenceEngineDeveloperPackageConfig.cmake.in b/cmake/templates/InferenceEngineDeveloperPackageConfig.cmake.in index 72af5ca89cadac..0f1f0d5e374f01 100644 --- a/cmake/templates/InferenceEngineDeveloperPackageConfig.cmake.in +++ b/cmake/templates/InferenceEngineDeveloperPackageConfig.cmake.in @@ -44,10 +44,30 @@ find_dependency(InferenceEngine NO_CMAKE_FIND_ROOT_PATH NO_DEFAULT_PATH) +find_dependency(ngraph + PATHS "${CMAKE_CURRENT_LIST_DIR}/ngraph" + NO_CMAKE_FIND_ROOT_PATH + NO_DEFAULT_PATH) + +# create targets with old names for compatibility +if(TARGET openvino::core AND NOT TARGET IE::core) + add_library(IE::core INTERFACE IMPORTED) + set_target_properties(IE::core PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::core) +endif() + +if(TARGET openvino::runtime AND NOT TARGET IE::runtime) + add_library(IE::runtime INTERFACE IMPORTED) + set_target_properties(IE::runtime PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::runtime) +endif() + # WA for cmake: it exports ngraph as IE::ngraph in the IE export list # while we already have ngraph export in its own 
export list as ngraph::ngraph -set_property(TARGET ngraph::ngraph PROPERTY IMPORTED_GLOBAL TRUE) -add_library(IE::ngraph ALIAS ngraph::ngraph) +if(TARGET ngraph::ngraph AND NOT TARGET IE::ngraph) + add_library(IE::ngraph INTERFACE IMPORTED) + set_target_properties(IE::ngraph PROPERTIES INTERFACE_LINK_LIBRARIES ngraph::ngraph) +endif() foreach(component @openvino_export_components@) include("${CMAKE_CURRENT_LIST_DIR}/${component}_dev_targets.cmake") diff --git a/cmake/templates/OpenVINOConfig-version.cmake.in b/cmake/templates/OpenVINOConfig-version.cmake.in new file mode 100644 index 00000000000000..4e42995a83013f --- /dev/null +++ b/cmake/templates/OpenVINOConfig-version.cmake.in @@ -0,0 +1,21 @@ +# Copyright (C) 2018-2021 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# + +set(PACKAGE_VERSION_MAJOR @IE_VERSION_MAJOR@) +set(PACKAGE_VERSION_MINOR @IE_VERSION_MINOR@) +set(PACKAGE_VERSION_PATCH @IE_VERSION_PATCH@) +set(PACKAGE_VERSION "${PACKAGE_VERSION_MAJOR}.${PACKAGE_VERSION_MINOR}.${PACKAGE_VERSION_PATCH}") + +set(PACKAGE_VERSION_EXACT False) +set(PACKAGE_VERSION_COMPATIBLE False) + +if(PACKAGE_FIND_VERSION VERSION_EQUAL PACKAGE_VERSION) + set(PACKAGE_VERSION_EXACT True) + set(PACKAGE_VERSION_COMPATIBLE True) +endif() + +if(PACKAGE_FIND_VERSION_MAJOR EQUAL PACKAGE_VERSION_MAJOR AND + PACKAGE_FIND_VERSION VERSION_LESS PACKAGE_VERSION) + set(PACKAGE_VERSION_COMPATIBLE True) +endif() diff --git a/cmake/templates/OpenVINOConfig.cmake.in b/cmake/templates/OpenVINOConfig.cmake.in new file mode 100644 index 00000000000000..14fc57b36c258d --- /dev/null +++ b/cmake/templates/OpenVINOConfig.cmake.in @@ -0,0 +1,203 @@ +# Copyright (C) 2018-2021 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# +# FindOpenVINO +# ------ +# +# Provides OpenVINO runtime for model creation and inference, frontend libraries +# to convert models from framework specific formats. 
+# +# The following components are supported: +# +# * `Runtime`: OpenVINO C++ and C Core & Inference Runtime, frontend manager +# * `ONNX`: OpenVINO ONNX frontend +# * `PaddlePaddle`: OpenVINO PaddlePaddle frontend +# +# If no components are specified, `Runtime` component is provided: +# +# find_package(OpenVINO REQUIRED) # only Runtime component +# +# If specific components are required: +# +# find_package(OpenVINO REQUIRED COMPONENTS Runtime ONNX) +# +# Imported Targets: +# ------ +# +# Runtime targets: +# +# `openvino::runtime` +# The OpenVINO C++ Core & Inference Runtime +# +# `openvino::runtime::c` +# The OpenVINO C Inference Runtime +# +# `openvino::core` +# The OpenVINO C++ Core Runtime +# +# Frontend specific targets: +# +# `openvino::frontend::manager` +# OpenVINO frontend manager +# +# `openvino::frontend::onnx` +# ONNX FrontEnd target (optional) +# +# `openvino::frontend::paddlepaddle` +# PaddlePaddle FrontEnd target (optional) +# +# Result variables: +# ------ +# +# The module sets the following variables in your project: +# +# `OpenVINO_FOUND` +# System has OpenVINO Runtime installed +# +# `OpenVINO_Runtime_FOUND` +# OpenVINO C++ Core & Inference Runtime is available +# +# `OpenVINO_Frontend_ONNX_FOUND` +# OpenVINO ONNX frontend is available +# +# `OpenVINO_Frontend_PaddlePaddle_FOUND` +# OpenVINO PaddlePaddle frontend is available +# +# OpenVINO version variables: +# +# `OpenVINO_VERSION_MAJOR` +# Major version component +# +# `OpenVINO_VERSION_MINOR` +# minor version component +# +# `OpenVINO_VERSION_PATCH` +# Patch version component +# + +@PACKAGE_INIT@ + +# +# Common functions +# + +if(NOT DEFINED CMAKE_FIND_PACKAGE_NAME) + set(CMAKE_FIND_PACKAGE_NAME OpenVINO) + set(_need_package_name_reset ON) +endif() + +# we have to use our own version of find_dependency because of support cmake 3.7 +macro(_ov_find_dependency dep) + set(cmake_fd_quiet_arg) + if(${CMAKE_FIND_PACKAGE_NAME}_FIND_QUIETLY) + set(cmake_fd_quiet_arg QUIET) + endif() + set(cmake_fd_required_arg) + if(${CMAKE_FIND_PACKAGE_NAME}_FIND_REQUIRED) + set(cmake_fd_required_arg REQUIRED) + endif() + + get_property(cmake_fd_alreadyTransitive GLOBAL PROPERTY + _CMAKE_${dep}_TRANSITIVE_DEPENDENCY) + + find_package(${dep} ${ARGN} + ${cmake_fd_quiet_arg} + ${cmake_fd_required_arg}) + + if(NOT DEFINED cmake_fd_alreadyTransitive OR cmake_fd_alreadyTransitive) + set_property(GLOBAL PROPERTY _CMAKE_${dep}_TRANSITIVE_DEPENDENCY TRUE) + endif() + + if(NOT ${dep}_FOUND) + set(${CMAKE_FIND_PACKAGE_NAME}_NOT_FOUND_MESSAGE "${CMAKE_FIND_PACKAGE_NAME} could not be found because dependency ${dep} could not be found.") + set(${CMAKE_FIND_PACKAGE_NAME}_FOUND False) + return() + endif() + + set(cmake_fd_required_arg) + set(cmake_fd_quiet_arg) +endmacro() + +function(_ov_target_no_deprecation_error) + if(NOT MSVC) + if(CMAKE_CXX_COMPILER_ID STREQUAL "Intel") + set(flags "-diag-warning=1786") + else() + set(flags "-Wno-error=deprecated-declarations") + endif() + if(CMAKE_CROSSCOMPILING) + set_target_properties(${ARGV} PROPERTIES + INTERFACE_LINK_OPTIONS "-Wl,--allow-shlib-undefined") + endif() + + set_target_properties(${ARGV} PROPERTIES INTERFACE_COMPILE_OPTIONS ${flags}) + endif() +endfunction() + +# +# OpenVINO config +# + +# need to store current PACKAGE_PREFIX_DIR, because it's overwritten by sub-package one +set(_ov_package_prefix_dir "${PACKAGE_PREFIX_DIR}") + +set(THREADING "@THREADING@") +if(THREADING STREQUAL "TBB" OR THREADING STREQUAL "TBB_AUTO" AND NOT TBB_FOUND) + set_and_check(_tbb_dir "@PACKAGE_IE_TBB_DIR@") + 
_ov_find_dependency(TBB + COMPONENTS tbb tbbmalloc + CONFIG + PATHS ${TBBROOT}/cmake + ${_tbb_dir} + NO_CMAKE_FIND_ROOT_PATH + NO_DEFAULT_PATH) +endif() + +if(NOT TARGET inference_engine) + set(_ov_as_external_package ON) + include("${CMAKE_CURRENT_LIST_DIR}/OpenVINOTargets.cmake") +endif() + +# +# Components +# + +set(${CMAKE_FIND_PACKAGE_NAME}_Runtime_FOUND ON) + +set(${CMAKE_FIND_PACKAGE_NAME}_ONNX_FOUND @NGRAPH_ONNX_FRONTEND_ENABLE@) +set(${CMAKE_FIND_PACKAGE_NAME}_PaddlePaddle_FOUND @NGRAPH_PDPD_FRONTEND_ENABLE@) + +set(${CMAKE_FIND_PACKAGE_NAME}_Frontend_ONNX_FOUND ${${CMAKE_FIND_PACKAGE_NAME}_ONNX_FOUND}) +set(${CMAKE_FIND_PACKAGE_NAME}_Frontend_PaddlePaddle_FOUND ${${CMAKE_FIND_PACKAGE_NAME}_PaddlePaddle_FOUND}) + +# if no components specified, only Runtime is provided +if(NOT ${CMAKE_FIND_PACKAGE_NAME}_FIND_COMPONENTS) + set(${CMAKE_FIND_PACKAGE_NAME}_FIND_COMPONENTS Runtime) +endif() + +# +# Apply common functions +# + +foreach(target openvino::runtime openvino::runtime::c openvino::core + openvino::frontend::manager openvino::frontend::onnx + openvino::frontend::paddlepaddle) + if(TARGET ${target} AND _ov_as_external_package) + _ov_target_no_deprecation_error(${target}) + endif() +endforeach() +unset(_ov_as_external_package) + +# restore PACKAGE_PREFIX_DIR +set(PACKAGE_PREFIX_DIR ${_ov_package_prefix_dir}) +unset(_ov_package_prefix_dir) + +check_required_components(${CMAKE_FIND_PACKAGE_NAME}) + +if(_need_package_name_reset) + unset(CMAKE_FIND_PACKAGE_NAME) + unset(_need_package_name_reset) +endif() + +unset(${CMAKE_FIND_PACKAGE_NAME}_PaddlePaddle_FOUND) +unset(${CMAKE_FIND_PACKAGE_NAME}_ONNX_FOUND) diff --git a/cmake/templates/ngraphConfig.cmake.in b/cmake/templates/ngraphConfig.cmake.in index 1c17cbeb4cc49a..a94e6b50a58933 100644 --- a/cmake/templates/ngraphConfig.cmake.in +++ b/cmake/templates/ngraphConfig.cmake.in @@ -37,28 +37,56 @@ @PACKAGE_INIT@ -if(NOT TARGET ngraph) - include("${CMAKE_CURRENT_LIST_DIR}/ngraphTargets.cmake") +include(CMakeFindDependencyMacro) + +find_dependency(OpenVINO + PATHS "${CMAKE_CURRENT_LIST_DIR}" + "${CMAKE_CURRENT_LIST_DIR}/ngraph" + NO_CMAKE_FIND_ROOT_PATH + NO_DEFAULT_PATH) + +# create targets with old names for compatibility +if(TARGET openvino::core AND NOT TARGET ngraph::ngraph) + add_library(ngraph::ngraph INTERFACE IMPORTED) + set_target_properties(ngraph::ngraph PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::core) +endif() + +if(TARGET openvino::frontend::manager AND NOT TARGET ngraph::frontend_manager) + add_library(ngraph::frontend_manager INTERFACE IMPORTED) + set_target_properties(ngraph::frontend_manager PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::frontend::manager) +endif() + +if(TARGET openvino::frontend::onnx AND NOT TARGET ngraph::onnx_ngraph_frontend) + add_library(ngraph::onnx_ngraph_frontend INTERFACE IMPORTED) + set_target_properties(ngraph::onnx_ngraph_frontend PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::frontend::onnx) +endif() + +if(TARGET openvino::frontend::paddlepaddle AND NOT TARGET ngraph::paddlepaddle_ngraph_frontend) + add_library(ngraph::paddlepaddle_ngraph_frontend INTERFACE IMPORTED) + set_target_properties(ngraph::paddlepaddle_ngraph_frontend PROPERTIES + INTERFACE_LINK_LIBRARIES openvino::frontend::paddlepaddle) endif() set(ngraph_ngraph_FOUND ON) set(NGRAPH_LIBRARIES ngraph::ngraph) -set(ngraph_onnx_ngraph_frontend_FOUND @NGRAPH_ONNX_FRONTEND_ENABLE@) +set(ngraph_onnx_ngraph_frontend_FOUND ${OpenVINO_Frontend_ONNX_FOUND}) +set(ngraph_onnx_importer_FOUND ${OpenVINO_Frontend_ONNX_FOUND}) -# 
ngraph::onnx_importer target and variables are deprecated -set(ngraph_onnx_importer_FOUND @NGRAPH_ONNX_FRONTEND_ENABLE@) if(ngraph_onnx_importer_FOUND) set(ONNX_IMPORTER_LIBRARIES ngraph::onnx_ngraph_frontend) + # ngraph::onnx_importer target and variables are deprecated + # but need to create a dummy target for BW compatibility if(NOT TARGET ngraph::onnx_importer) add_library(ngraph::onnx_importer INTERFACE IMPORTED) set_target_properties(ngraph::onnx_importer PROPERTIES - INTERFACE_LINK_LIBRARIES ngraph::onnx_ngraph_frontend - ) + INTERFACE_LINK_LIBRARIES ngraph::onnx_ngraph_frontend) endif() endif() -set(ngraph_paddlepaddle_frontend_FOUND @NGRAPH_PDPD_FRONTEND_ENABLE@) -set(ir_frontend_FOUND @IR_FRONTEND_ENABLE@) +set(ngraph_paddlepaddle_frontend_FOUND ${OpenVINO_Frontend_PaddlePaddle_FOUND}) check_required_components(ngraph) diff --git a/docs/CMakeLists.txt b/docs/CMakeLists.txt index 4d3135903de149..6eac6cc9ecbffa 100644 --- a/docs/CMakeLists.txt +++ b/docs/CMakeLists.txt @@ -9,20 +9,12 @@ if(NOT ENABLE_DOCKER) add_subdirectory(snippets) - # Detect nGraph - find_package(ngraph QUIET - PATHS "${CMAKE_BINARY_DIR}/ngraph" - NO_DEFAULT_PATH) - if(NOT ngraph_FOUND) - set(ngraph_DIR ${CMAKE_BINARY_DIR}/ngraph) - endif() - - # Detect InferenceEngine - find_package(InferenceEngine QUIET + # Detect OpenVINO + find_package(OpenVINO QUIET PATHS "${CMAKE_BINARY_DIR}" NO_DEFAULT_PATH) - if(NOT InferenceEngine_FOUND) - set(InferenceEngine_DIR ${CMAKE_BINARY_DIR}) + if(NOT OpenVINO_FOUND) + set(OpenVINO_DIR ${CMAKE_BINARY_DIR}) endif() if(NGRAPH_ONNX_FRONTEND_ENABLE) @@ -72,7 +64,7 @@ function(build_docs) set(C_API "${IE_SOURCE_DIR}/ie_bridges/c/include") set(PLUGIN_API_DIR "${DOCS_BUILD_DIR}/IE_PLUGIN_DG") set(NGRAPH_DIR "${OpenVINO_SOURCE_DIR}/ngraph") - set(NGRAPH_PY_DIR "${NGRAPH_DIR}/python/src/ngraph/") + set(NGRAPH_PY_DIR "${OpenVINO_SOURCE_DIR}/runtime/bindings/python/src/compatibility/ngraph/") set(NGRAPH_CPP_DIR "${NGRAPH_DIR}/core/include/" "${NGRAPH_DIR}/frontend/onnx_import/include") # Preprocessing scripts diff --git a/docs/HOWTO/Custom_Layers_Guide.md b/docs/HOWTO/Custom_Layers_Guide.md index cda4ed1c968f47..4bea76f5902baa 100644 --- a/docs/HOWTO/Custom_Layers_Guide.md +++ b/docs/HOWTO/Custom_Layers_Guide.md @@ -313,7 +313,7 @@ operation for the CPU plugin. The code of the library is described in the [Exte To build the extension, run the following:
```bash mkdir build && cd build -source /opt/intel/openvino_2021/bin/setupvars.sh +source /opt/intel/openvino_2022/setupvars.sh cmake .. -DCMAKE_BUILD_TYPE=Release make --jobs=$(nproc) ``` diff --git a/docs/IE_DG/Cross_Check_Tool.md b/docs/IE_DG/Cross_Check_Tool.md index 495afa790fcccc..d53d3dddfe47de 100644 --- a/docs/IE_DG/Cross_Check_Tool.md +++ b/docs/IE_DG/Cross_Check_Tool.md @@ -8,11 +8,11 @@ The Cross Check Tool can compare metrics per layer or all over the model. On Linux* OS, before running the Cross Check Tool binary, make sure your application can find the Deep Learning Inference Engine libraries. -Navigate to the `/deployment_tools/inference_engine/bin` folder and run the `setvars.sh` script to +Navigate to the `` folder and run the `setupvars.sh` script to set all necessary environment variables: ```sh -source setvars.sh +source setupvars.sh ``` ## Running the Cross Check Tool diff --git a/docs/IE_DG/Deep_Learning_Inference_Engine_DevGuide.md b/docs/IE_DG/Deep_Learning_Inference_Engine_DevGuide.md index 0f07f5503811f5..e2960c5dd87394 100644 --- a/docs/IE_DG/Deep_Learning_Inference_Engine_DevGuide.md +++ b/docs/IE_DG/Deep_Learning_Inference_Engine_DevGuide.md @@ -1,7 +1,5 @@ # Inference Engine Developer Guide {#openvino_docs_IE_DG_Deep_Learning_Inference_Engine_DevGuide} -> **NOTE:** [Intel® System Studio](https://software.intel.com/content/www/us/en/develop/tools/oneapi/commercial-base-iot.html) (click "Intel® System Studio Users" tab) is an all-in-one, cross-platform tool suite, purpose-built to simplify system bring-up and improve system and IoT device application performance on Intel® platforms. If you are using the Intel® Distribution of OpenVINO™ with Intel® System Studio, go to [Get Started with Intel® System Studio](https://software.intel.com/en-us/articles/get-started-with-openvino-and-intel-system-studio-2019). - This Guide provides an overview of the Inference Engine describing the typical workflow for performing inference of a pre-trained and optimized deep learning model and a set of sample applications. > **NOTE:** Before you perform inference with the Inference Engine, your models should be converted to the Inference Engine format using the Model Optimizer or built directly in runtime using nGraph API. To learn about how to use Model Optimizer, refer to the [Model Optimizer Developer Guide](../MO_DG/Deep_Learning_Model_Optimizer_DevGuide.md). To learn about the pre-trained and optimized models delivered with the OpenVINO™ toolkit, refer to [Pre-Trained Models](@ref omz_models_group_intel). @@ -81,9 +79,9 @@ Make sure those libraries are in your computer's path or in the place you pointe * Windows: `PATH` * macOS: `DYLD_LIBRARY_PATH` -On Linux and macOS, use the script `bin/setupvars.sh` to set the environment variables. +On Linux and macOS, use the script `setupvars.sh` to set the environment variables. -On Windows, run the `bin\setupvars.bat` batch file to set the environment variables. +On Windows, run the `setupvars.bat` batch file to set the environment variables. To learn more about supported devices and corresponding plugins, see the [Supported Devices](supported_plugins/Supported_Devices.md) chapter. @@ -111,10 +109,8 @@ The common workflow contains the following steps: 8. **Get the output** - After inference is completed, get the output memory or read the memory you provided earlier. Do this with the `InferenceEngine::IInferRequest::GetBlob()` method. 
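The workflow steps kept as context in the hunk above (ending with `InferenceEngine::IInferRequest::GetBlob()`) correspond to a short piece of application code. The sketch below is an illustration only and is not part of this patch; it assumes the classic `InferenceEngine` C++ API that the guide documents, and the model path, device name, and use of the first input/output are placeholder assumptions.

```cpp
#include <inference_engine.hpp>
#include <string>

int main() {
    // Create the Inference Engine Core object.
    InferenceEngine::Core core;

    // Read a model in IR format (placeholder file names).
    InferenceEngine::CNNNetwork network = core.ReadNetwork("model.xml", "model.bin");

    // Query input/output names; per-layer precision/layout configuration is omitted here.
    const std::string input_name = network.getInputsInfo().begin()->first;
    const std::string output_name = network.getOutputsInfo().begin()->first;

    // Load the network to a device (placeholder device name) and create an inference request.
    InferenceEngine::ExecutableNetwork executable_network = core.LoadNetwork(network, "CPU");
    InferenceEngine::InferRequest request = executable_network.CreateInferRequest();

    // Fill the input blob with data (population omitted) and run inference synchronously.
    InferenceEngine::Blob::Ptr input_blob = request.GetBlob(input_name);
    // ... populate input_blob ...
    request.Infer();

    // "Get the output": read the output blob after inference completes.
    InferenceEngine::Blob::Ptr output_blob = request.GetBlob(output_name);
    return output_blob != nullptr ? 0 : 1;
}
```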
## Video: Inference Engine Concept -[![](https://img.youtube.com/vi/e6R13V8nbak/0.jpg)](https://www.youtube.com/watch?v=e6R13V8nbak) -\htmlonly + -\endhtmlonly ## Further Reading diff --git a/docs/IE_DG/Extensibility_DG/AddingNGraphOps.md b/docs/IE_DG/Extensibility_DG/AddingNGraphOps.md index 8ca911f7d0cda9..ed4d65595320a5 100644 --- a/docs/IE_DG/Extensibility_DG/AddingNGraphOps.md +++ b/docs/IE_DG/Extensibility_DG/AddingNGraphOps.md @@ -1,6 +1,6 @@ # Custom nGraph Operation {#openvino_docs_IE_DG_Extensibility_DG_AddingNGraphOps} -Inference Engine Extension API allows you to register operation sets (opsets) with custom nGraph operations to support models with operations which OpenVINO™ does not support out-of-the-box. +The Inference Engine Extension API allows you to register operation sets (opsets) with custom nGraph operations to support models with operations that OpenVINO™ does not support out-of-the-box. ## Operation Class diff --git a/docs/IE_DG/Extensibility_DG/Building.md b/docs/IE_DG/Extensibility_DG/Building.md index d1f62cb53a822d..be93c5a06d3bc9 100644 --- a/docs/IE_DG/Extensibility_DG/Building.md +++ b/docs/IE_DG/Extensibility_DG/Building.md @@ -14,6 +14,6 @@ To build an extension library, run the commands below: $ cd template_extension $ mkdir build $ cd build -$ cmake -DInferenceEngine_DIR=[IE_DIR] -Dngraph_DIR=[NGRAPH_DIR] ../ +$ cmake -DOpenVINO_DIR=[OpenVINO_DIR] ../ $ cmake --build . ``` diff --git a/docs/IE_DG/Extensibility_DG/Custom_ONNX_Ops.md b/docs/IE_DG/Extensibility_DG/Custom_ONNX_Ops.md index a9a9841cac457f..eb7183f0dc246b 100644 --- a/docs/IE_DG/Extensibility_DG/Custom_ONNX_Ops.md +++ b/docs/IE_DG/Extensibility_DG/Custom_ONNX_Ops.md @@ -50,8 +50,8 @@ The example below demonstrates how to unregister an operator from the destructor ## Requirements for Building with CMake -A program that uses the `register_operator` functionality requires `ngraph::ngraph` and `ngraph::onnx_ngraph_frontend` libraries in addition to the Inference Engine. -The `onnx_ngraph_frontend` is a component of the `ngraph` package , so `find_package(ngraph REQUIRED COMPONENTS onnx_ngraph_frontend)` can find both. +A program that uses the `register_operator` functionality requires `openvino::core` and `openvino::frontend::onnx` libraries in addition to the OpenVINO Inference Runtime. +The `onnx_ngraph_frontend` is a component of the `OpenVINO` package , so `find_package(OpenVINO REQUIRED COMPONENTS ONNX)` can find both. Those libraries need to be passed to the `target_link_libraries` command in the CMakeLists.txt file. See CMakeLists.txt below for reference: diff --git a/docs/IE_DG/Extensibility_DG/Extension.md b/docs/IE_DG/Extensibility_DG/Extension.md index 178d0099df68ee..e941cb9c13c1a8 100644 --- a/docs/IE_DG/Extensibility_DG/Extension.md +++ b/docs/IE_DG/Extensibility_DG/Extension.md @@ -25,5 +25,6 @@ Also, an `Extension` object should implement the following methods: Implement the InferenceEngine::IExtension::getOpSets method if the extension contains custom layers. Read [Custom nGraph Operation](AddingNGraphOps.md) for more information. -To integrate execution kernels to the extension library, read [How to Implement Custom CPU Operations](CPU_Kernel.md). -To register a custom ONNX\* operator to the extension library, read [Custom ONNX Operators](Custom_ONNX_Ops.md). +To understand how to integrate execution kernels to the extension library, read the [documentation about development of custom CPU kernels](CPU_Kernel.md). 
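For context on the Custom_ONNX_Ops.md change above (`find_package(ngraph ...)` replaced by `find_package(OpenVINO REQUIRED COMPONENTS ONNX)`), a consumer CMakeLists.txt written against the new package would presumably look roughly like the sketch below. The project name, target name, and source file are illustrative and not taken from the patch; the component and imported target names are the ones documented in the new OpenVINOConfig.cmake.in introduced earlier in this diff.

```cmake
cmake_minimum_required(VERSION 3.13)
project(onnx_custom_op)

# New-style lookup: a single OpenVINO package with components, instead of
# separate ngraph / InferenceEngine packages.
find_package(OpenVINO REQUIRED COMPONENTS ONNX)

add_library(onnx_custom_op SHARED onnx_custom_op.cpp)

# openvino::core and openvino::frontend::onnx replace ngraph::ngraph and
# ngraph::onnx_ngraph_frontend from the pre-2022 layout.
target_link_libraries(onnx_custom_op PRIVATE openvino::core openvino::frontend::onnx)
```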
+ +To understand how to register custom ONNX operator to the extension library, read the [documentation about custom ONNX operators](Custom_ONNX_Ops.md). diff --git a/docs/IE_DG/Extensibility_DG/GPU_Kernel.md b/docs/IE_DG/Extensibility_DG/GPU_Kernel.md index d9fd809f8e4227..f206c2c0bcb41e 100644 --- a/docs/IE_DG/Extensibility_DG/GPU_Kernel.md +++ b/docs/IE_DG/Extensibility_DG/GPU_Kernel.md @@ -4,7 +4,7 @@ The GPU codepath abstracts many details about OpenCL\*. You need to provide the There are two options of using the custom operation configuration file: -* Include a section with your kernels into the global automatically-loaded `cldnn_global_custom_kernels/cldnn_global_custom_kernels.xml` file, which is hosted in the `/deployment_tools/inference_engine/bin/intel64/{Debug/Release}` folder +* Include a section with your kernels into the global automatically-loaded `cldnn_global_custom_kernels/cldnn_global_custom_kernels.xml` file, which is hosted in the `/runtime/bin` folder * Call the `InferenceEngine::Core::SetConfig()` method from your application with the `InferenceEngine::PluginConfigParams::KEY_CONFIG_FILE` key and the configuration file name as a value before loading the network that uses custom operations to the plugin: @snippet snippets/GPU_Kernel.cpp part0 diff --git a/docs/IE_DG/Extensibility_DG/VPU_Kernel.md b/docs/IE_DG/Extensibility_DG/VPU_Kernel.md index 033097598317bf..4dca14ce50233e 100644 --- a/docs/IE_DG/Extensibility_DG/VPU_Kernel.md +++ b/docs/IE_DG/Extensibility_DG/VPU_Kernel.md @@ -15,18 +15,18 @@ To customize your topology with an OpenCL layer, follow the steps below: > **NOTE:** OpenCL compiler, targeting Intel® Neural Compute Stick 2 for the SHAVE* processor only, is redistributed with OpenVINO. OpenCL support is provided by ComputeAorta*, and is distributed under a license agreement between Intel® and Codeplay* Software Ltd. -The OpenCL toolchain for the Intel® Neural Compute Stick 2 supports offline compilation only, so first compile OpenCL C code using the standalone `clc` compiler. You can find the compiler binary at `/deployment_tools/tools/cl_compiler`. +The OpenCL toolchain for the Intel® Neural Compute Stick 2 supports offline compilation only, so first compile OpenCL C code using the standalone `clc` compiler. You can find the compiler binary at `/tools/cl_compiler`. > **NOTE:** By design, custom OpenCL layers support any OpenCL kernels written with 1.2 version assumed. It also supports half float extension and is optimized for this type, because it is a native type for Intel® Movidius™ VPUs. 1. Prior to running a compilation, make sure that the following variables are set: - * `SHAVE_MA2X8XLIBS_DIR=/deployment_tools/tools/cl_compiler/lib/` - * `SHAVE_LDSCRIPT_DIR=/deployment_tools/tools/cl_compiler/ldscripts/` - * `SHAVE_MYRIAD_LD_DIR=/deployment_tools/tools/cl_compiler/bin/` - * `SHAVE_MOVIASM_DIR=/deployment_tools/tools/cl_compiler/bin/` + * `SHAVE_MA2X8XLIBS_DIR=/tools/cl_compiler/lib/` + * `SHAVE_LDSCRIPT_DIR=/tools/cl_compiler/ldscripts/` + * `SHAVE_MYRIAD_LD_DIR=/tools/cl_compiler/bin/` + * `SHAVE_MOVIASM_DIR=/tools/cl_compiler/bin/` 2. Run the compilation with the command below. You should use `--strip-binary-header` to make an OpenCL runtime-agnostic binary runnable with the Inference Engine. 
```bash -cd /deployment_tools/tools/cl_compiler/bin +cd /tools/cl_compiler/bin ./clc --strip-binary-header custom_layer.cl -o custom_layer.bin ``` diff --git a/docs/IE_DG/Glossary.md b/docs/IE_DG/Glossary.md index 41e2b1b1dab0b9..706e71591852d8 100644 --- a/docs/IE_DG/Glossary.md +++ b/docs/IE_DG/Glossary.md @@ -19,7 +19,6 @@ Glossary {#openvino_docs_IE_DG_Glossary} | ELU | Exponential Linear rectification Unit | | FCN | Fully Convolutional Network | | FP | Floating Point | -| FPGA | Field-Programmable Gate Array | | GCC | GNU Compiler Collection | | GPU | Graphics Processing Unit | | HD | High Definition | diff --git a/docs/IE_DG/InferenceEngine_QueryAPI.md b/docs/IE_DG/InferenceEngine_QueryAPI.md index 8588e00e5ceb62..90fa6bfb2cb17c 100644 --- a/docs/IE_DG/InferenceEngine_QueryAPI.md +++ b/docs/IE_DG/InferenceEngine_QueryAPI.md @@ -29,8 +29,6 @@ The function returns list of available devices, for example: ``` MYRIAD.1.2-ma2480 MYRIAD.1.4-ma2480 -FPGA.0 -FPGA.1 CPU GPU.0 GPU.1 diff --git a/docs/IE_DG/Int8Inference.md b/docs/IE_DG/Int8Inference.md index 889af6a53278b1..2577e7dc4ecab7 100644 --- a/docs/IE_DG/Int8Inference.md +++ b/docs/IE_DG/Int8Inference.md @@ -1,12 +1,5 @@ # Low-Precision 8-bit Integer Inference {#openvino_docs_IE_DG_Int8Inference} -## Table of Contents -1. [Supported devices](#supported-devices) -2. [Low-Precision 8-bit Integer Inference Workflow](#low-precision-8-bit-integer-inference-workflow) -3. [Prerequisites](#prerequisites) -4. [Inference](#inference) -5. [Results analysis](#results-analysis) - ## Supported devices Low-precision 8-bit inference is optimized for: @@ -24,34 +17,35 @@ Low-precision 8-bit inference is optimized for: ## Low-Precision 8-bit Integer Inference Workflow -8-bit computations (referred to as `int8`) offer better performance compared to the results of inference in higher precision (for example, `fp32`), because they allow loading more data into a single processor instruction. Usually the cost for significant boost is a reduced accuracy. However, it is proved that an accuracy drop can be negligible and depends on task requirements, so that the application engineer can set up the maximum accuracy drop that is acceptable. +8-bit computations (referred to as `int8`) offer better performance compared to the results of inference in higher precision (for example, `fp32`), because they allow loading more data into a single processor instruction. Usually the cost for significant boost is reduced accuracy. However, it is proved that an accuracy drop can be negligible and depends on task requirements, so that the application engineer can set up the maximum accuracy drop that is acceptable. For 8-bit integer computations, a model must be quantized. Quantized models can be downloaded from [Overview of OpenVINO™ Toolkit Intel's Pre-Trained Models](@ref omz_models_group_intel). If the model is not quantized, you can use the [Post-Training Optimization Tool](@ref pot_README) to quantize the model. The quantization process adds [FakeQuantize](../ops/quantization/FakeQuantize_1.md) layers on activations and weights for most layers. Read more about mathematical computations in the [Uniform Quantization with Fine-Tuning](https://github.com/openvinotoolkit/nncf/blob/develop/docs/compression_algorithms/Quantization.md). When you pass the quantized IR to the OpenVINO™ plugin, the plugin automatically recognizes it as a quantized model and performs 8-bit inference. 
Note, if you pass a quantized model to another plugin that does not support 8-bit inference but supports all operations from the model, the model is inferred in precision that this plugin supports. -In *Runtime stage* stage, the quantized model is loaded to the plugin. The plugin uses `Low Precision Transformation` component to update the model to infer it in low precision: - - Update `FakeQuantize` layers to have quantized output tensors in low precision range and add dequantization layers to compensate the update. Dequantization layers are pushed through as many layers as possible to have more layers in low precision. After that, most layers have quantized input tensors in low precision range and can be inferred in low precision. Ideally, dequantization layers should be fused in the next `FakeQuantize` layer. - - Weights are quantized and stored in `Constant` layers. +In *Runtime stage*, the quantized model is loaded to the plugin. The plugin uses the `Low Precision Transformation` component to update the model to infer it in low precision: + - Update `FakeQuantize` layers to have quantized output tensors in a low precision range and add dequantization layers to compensate the update. Dequantization layers are pushed through as many layers as possible to have more layers in low precision. After that, most layers have quantized input tensors in the low precision range and can be inferred in low precision. Ideally, dequantization layers should be fused in the next `FakeQuantize` layer. + - Quantize weights and store them in `Constant` layers. ## Prerequisites -Let's explore quantized [TensorFlow* implementation of ResNet-50](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-50-tf) model. Use [Model Downloader](@ref omz_tools_downloader) tool to download the `fp16` model from [OpenVINO™ Toolkit - Open Model Zoo repository](https://github.com/openvinotoolkit/open_model_zoo): +Let's explore the quantized [TensorFlow* implementation of ResNet-50](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-50-tf) model. Use the [Model Downloader](@ref omz_tools_downloader) tool to download the `fp16` model from [OpenVINO™ Toolkit - Open Model Zoo repository](https://github.com/openvinotoolkit/open_model_zoo): ```sh -./downloader.py --name resnet-50-tf --precisions FP16-INT8 +cd $INTEL_OPENVINO_DIR/deployment_tools/tools/model_downloader +./downloader.py --name resnet-50-tf --precisions FP16-INT8 --output_dir ``` -After that you should quantize model by the [Model Quantizer](@ref omz_tools_downloader) tool. +After that, you should quantize the model with the [Model Quantizer](@ref omz_tools_downloader) tool. For the dataset, you can choose to download the ImageNet dataset from [here](https://www.image-net.org/download.php). ```sh -./quantizer.py --model_dir public/resnet-50-tf --dataset_dir --precisions=FP16-INT8 +./quantizer.py --model_dir --name public/resnet-50-tf --dataset_dir --precisions=FP16-INT8 ``` ## Inference -The simplest way to infer the model and collect performance counters is [C++ Benchmark Application](../../inference-engine/samples/benchmark_app/README.md). +The simplest way to infer the model and collect performance counters is the [C++ Benchmark Application](../../inference-engine/samples/benchmark_app/README.md). 
```sh ./benchmark_app -m resnet-50-tf.xml -d CPU -niter 1 -api sync -report_type average_counters -report_folder pc_report_dir ``` -If you infer the model with the OpenVINO™ CPU plugin and collect performance counters, all operations (except last not quantized SoftMax) are executed in INT8 precision. +If you infer the model with the Inference Engine CPU plugin and collect performance counters, all operations (except the last non-quantized SoftMax) are executed in INT8 precision. ## Results analysis diff --git a/docs/IE_DG/Integrate_with_customer_application_new_API.md b/docs/IE_DG/Integrate_with_customer_application_new_API.md index 93482a9093887e..870d840c95cd21 100644 --- a/docs/IE_DG/Integrate_with_customer_application_new_API.md +++ b/docs/IE_DG/Integrate_with_customer_application_new_API.md @@ -35,7 +35,7 @@ Integration process includes the following steps: @snippet snippets/Integrate_with_customer_application_new_API.cpp part1 -**Or read the model from ONNX format** (.onnx and .prototxt are supported formats). You can find more information about the ONNX format support in the document [ONNX format support in the OpenVINO™](./ONNX_Support.md). +**Or read the model from ONNX format**. You can find more information about the ONNX format support in the document [ONNX format support in the OpenVINO™](./ONNX_Support.md). @snippet snippets/Integrate_with_customer_application_new_API.cpp part2 @@ -173,7 +173,7 @@ Note that casting `Blob` to `TBlob` via `std::dynamic_pointer_cast` is not the r ## Build Your Application For details about building your application, refer to the CMake files for the sample applications. -All samples source code is located in the `/openvino/inference_engine/samples` directory, where `INSTALL_DIR` is the OpenVINO™ installation directory. +All samples source code is located in the `/samples` directory, where `INSTALL_DIR` is the OpenVINO™ installation directory. ### CMake project creation @@ -193,14 +193,13 @@ build/ - build directory ``` cmake cmake_minimum_required(VERSION 3.0.0) project(project_name) -find_package(ngraph REQUIRED) -find_package(InferenceEngine REQUIRED) +find_package(OpenVINO REQUIRED) find_package(OpenCV REQUIRED) add_executable(${PROJECT_NAME} src/main.cpp) -target_link_libraries(${PROJECT_NAME} PRIVATE ${InferenceEngine_LIBRARIES} ${OpenCV_LIBS} ${NGRAPH_LIBRARIES}) +target_link_libraries(${PROJECT_NAME} PRIVATE openvino::runtime ${OpenCV_LIBS}) ``` 3. **To build your project** using CMake with the default build tools currently available on your machine, execute the following commands: -> **NOTE**: Make sure you set environment variables first by running `/bin/setupvars.sh` (or setupvars.bat for Windows)`. Otherwise the `InferenceEngine_DIR` and `OpenCV_DIR` variables won't be configured properly to pass `find_package` calls. +> **NOTE**: Make sure you set environment variables first by running `/setupvars.sh` (or setupvars.bat for Windows)`. Otherwise the `InferenceEngine_DIR` and `OpenCV_DIR` variables won't be configured properly to pass `find_package` calls. 
```sh cd build/ cmake ../project diff --git a/docs/IE_DG/Intro_to_Performance.md b/docs/IE_DG/Intro_to_Performance.md index 48d1ea5c56cff0..ca360d0d06f1c0 100644 --- a/docs/IE_DG/Intro_to_Performance.md +++ b/docs/IE_DG/Intro_to_Performance.md @@ -34,7 +34,7 @@ Refer to the [Benchmark App](../../inference-engine/samples/benchmark_app/README ## Using Caching API for first inference latency optimization Since with the 2021.4 release, Inference Engine provides an ability to enable internal caching of loaded networks. This can significantly reduce load network latency for some devices at application startup. -Internally caching uses plugin's Export/ImportNetwork flow, like it is done for [Compile tool](../../inference-engine/tools/compile_tool/README.md), using the regular ReadNetwork/LoadNetwork API. +Internally caching uses plugin's Export/ImportNetwork flow, like it is done for [Compile tool](../../tools/compile_tool/README.md), using the regular ReadNetwork/LoadNetwork API. Refer to the [Model Caching Overview](Model_caching_overview.md) for more detailed explanation. ## Using Async API diff --git a/docs/IE_DG/Legal_Information.md b/docs/IE_DG/Legal_Information.md deleted file mode 100644 index 3b39dba5810fa4..00000000000000 --- a/docs/IE_DG/Legal_Information.md +++ /dev/null @@ -1,12 +0,0 @@ -# Legal Information {#openvino_docs_IE_DG_Legal_Information} - -No license (express or implied, by estoppel or otherwise) to any intellectual property rights is granted by this document.
-Intel disclaims all express and implied warranties, including without limitation, the implied warranties of merchantability, fitness for a particular purpose, and non-infringement, as well as any warranty arising from course of performance, course of dealing, or usage in trade.
-This document contains information on products, services and/or processes in development. All information provided here is subject to change without notice. Contact your Intel representative to obtain the latest forecast, schedule, specifications and roadmaps.
-The products and services described may contain defects or errors known as errata which may cause deviations from published specifications. Current characterized errata are available on request.
-Copies of documents which have an order number and are referenced in this document may be obtained by calling 1-800-548-4725 or by visiting [www.intel.com/design/literature.htm](http://www.intel.com/design/literature.htm).
-Intel, Intel logo, Intel Core, VTune, Xeon are trademarks of Intel Corporation in the U.S. and other countries.
-\* Other names and brands may be claimed as the property of others.
-Copyright © 2016-2018 Intel Corporation.
-This software and the related documents are Intel copyrighted materials, and your use of them is governed by the express license under which they were provided to you (License). Unless the License provides otherwise, you may not use, modify, copy, publish, distribute, disclose or transmit this software or the related documents without Intel's prior written permission.
-This software and the related documents are provided as is, with no express or implied warranties, other than those that are expressly stated in the License.
diff --git a/docs/IE_DG/Model_caching_overview.md b/docs/IE_DG/Model_caching_overview.md index 10d3d6cf99e302..d480d7626d9859 100644 --- a/docs/IE_DG/Model_caching_overview.md +++ b/docs/IE_DG/Model_caching_overview.md @@ -20,7 +20,7 @@ As described in [Inference Engine Developer Guide](Deep_Learning_Inference_Engin Step #5 can potentially perform several time-consuming device-specific optimizations and network compilations, and such delays can lead to bad user experience on application startup. To avoid this, some devices offer -Import/Export network capability, and it is possible to either use [Compile tool](../../inference-engine/tools/compile_tool/README.md) +Import/Export network capability, and it is possible to either use [Compile tool](../../tools/compile_tool/README.md) or enable model caching to export compiled network automatically. Reusing cached networks can significantly reduce load network time. diff --git a/docs/IE_DG/Samples_Overview.md b/docs/IE_DG/Samples_Overview.md index f9e21cf5e4dcce..db989aac76f596 100644 --- a/docs/IE_DG/Samples_Overview.md +++ b/docs/IE_DG/Samples_Overview.md @@ -3,9 +3,9 @@ The Inference Engine sample applications are simple console applications that show how to utilize specific Inference Engine capabilities within an application, assist developers in executing specific tasks such as loading a model, running inference, querying specific device capabilities and etc. After installation of Intel® Distribution of OpenVINO™ toolkit, С, C++ and Python* sample applications are available in the following directories, respectively: -* `/inference_engine/samples/c` -* `/inference_engine/samples/cpp` -* `/inference_engine/samples/python` +* `/samples/c` +* `/samples/cpp` +* `/samples/python` Inference Engine sample applications include the following: @@ -64,7 +64,7 @@ The officially supported Linux* build environment is the following: > **NOTE**: For building samples from the open-source version of OpenVINO™ toolkit, see the [build instructions on GitHub](https://github.com/openvinotoolkit/openvino/wiki/BuildingCode). -To build the C or C++ sample applications for Linux, go to the `/inference_engine/samples/c` or `/inference_engine/samples/cpp` directory, respectively, and run the `build_samples.sh` script: +To build the C or C++ sample applications for Linux, go to the `/samples/c` or `/samples/cpp` directory, respectively, and run the `build_samples.sh` script: ```sh build_samples.sh ``` @@ -91,11 +91,11 @@ cd build 3. Run CMake to generate the Make files for release or debug configuration. For example, for C++ samples: - For release configuration: ```sh - cmake -DCMAKE_BUILD_TYPE=Release /inference_engine/samples/cpp + cmake -DCMAKE_BUILD_TYPE=Release /samples/cpp ``` - For debug configuration: ```sh - cmake -DCMAKE_BUILD_TYPE=Debug /inference_engine/samples/cpp + cmake -DCMAKE_BUILD_TYPE=Debug /samples/cpp ``` 4. Run `make` to build the samples: ```sh @@ -109,12 +109,12 @@ for the debug configuration — in `/intel64/Debug/`. The recommended Windows* build environment is the following: * Microsoft Windows* 10 -* Microsoft Visual Studio* 2017, or 2019 +* Microsoft Visual Studio* 2017, or 2019. Make sure that C++ CMake tools for Windows is [enabled](https://docs.microsoft.com/en-us/cpp/build/cmake-projects-in-visual-studio?view=msvc-160#:~:text=The%20Visual%20C%2B%2B%20Tools%20for,Visual%20Studio%20generators%20are%20supported). 
* CMake* version 3.10 or higher > **NOTE**: If you want to use Microsoft Visual Studio 2019, you are required to install CMake 3.14. -To build the C or C++ sample applications on Windows, go to the `\inference_engine\samples\c` or `\inference_engine\samples\cpp` directory, respectively, and run the `build_samples_msvc.bat` batch file: +To build the C or C++ sample applications on Windows, go to the `\samples\c` or `\samples\cpp` directory, respectively, and run the `build_samples_msvc.bat` batch file: ```sh build_samples_msvc.bat ``` @@ -123,7 +123,7 @@ By default, the script automatically detects the highest Microsoft Visual Studio a solution for a sample code. Optionally, you can also specify the preferred Microsoft Visual Studio version to be used by the script. Supported versions are `VS2017` and `VS2019`. For example, to build the C++ samples using the Microsoft Visual Studio 2017, use the following command: ```sh -\inference_engine\samples\cpp\build_samples_msvc.bat VS2017 +\samples\cpp\build_samples_msvc.bat VS2017 ``` Once the build is completed, you can find sample binaries in the following folders: @@ -144,7 +144,7 @@ The officially supported macOS* build environment is the following: > **NOTE**: For building samples from the open-source version of OpenVINO™ toolkit, see the [build instructions on GitHub](https://github.com/openvinotoolkit/openvino/wiki/BuildingCode). -To build the C or C++ sample applications for macOS, go to the `/inference_engine/samples/c` or `/inference_engine/samples/cpp` directory, respectively, and run the `build_samples.sh` script: +To build the C or C++ sample applications for macOS, go to the `/samples/c` or `/samples/cpp` directory, respectively, and run the `build_samples.sh` script: ```sh build_samples.sh ``` @@ -177,11 +177,11 @@ cd build 3. Run CMake to generate the Make files for release or debug configuration. For example, for C++ samples: - For release configuration: ```sh - cmake -DCMAKE_BUILD_TYPE=Release /inference_engine/samples/cpp + cmake -DCMAKE_BUILD_TYPE=Release /samples/cpp ``` - For debug configuration: ```sh - cmake -DCMAKE_BUILD_TYPE=Debug /inference_engine/samples/cpp + cmake -DCMAKE_BUILD_TYPE=Debug /samples/cpp ``` 4. Run `make` to build the samples: ```sh @@ -199,7 +199,7 @@ Before running compiled binary files, make sure your application can find the Inference Engine and OpenCV libraries. Run the `setupvars` script to set all necessary environment variables: ```sh -source /bin/setupvars.sh +source /setupvars.sh ``` **(Optional)**: The OpenVINO environment variables are removed when you close the @@ -212,7 +212,7 @@ vi /.bashrc 2. Add this line to the end of the file: ```sh -source /opt/intel/openvino_2021/bin/setupvars.sh +source /opt/intel/openvino_2022/setupvars.sh ``` 3. Save and close the file: press the **Esc** key, type `:wq` and press the **Enter** key. @@ -228,7 +228,7 @@ Before running compiled binary files, make sure your application can find the Inference Engine and OpenCV libraries. Use the `setupvars` script, which sets all necessary environment variables: ```sh -\bin\setupvars.bat +\setupvars.bat ``` To debug or run the samples on Windows in Microsoft Visual Studio, make sure you @@ -240,7 +240,7 @@ For example, for the **Debug** configuration, go to the project's variable in the **Environment** field to the following: ```sh -PATH=\deployment_tools\inference_engine\bin\intel64\Debug;\opencv\bin;%PATH% +PATH=\runtime\bin;\opencv\bin;%PATH% ``` where `` is the directory in which the OpenVINO toolkit is installed. 
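Referring back to the caching passages in `Intro_to_Performance.md` and `Model_caching_overview.md` above, a minimal sketch of enabling the 2021.4+ model cache might look like the following; the cache directory, model path, and device name are assumptions for illustration:

```cpp
#include <inference_engine.hpp>
#include <ie_plugin_config.hpp>

int main() {
    InferenceEngine::Core core;
    // Point the runtime at a cache directory. For devices that support import/export,
    // the first LoadNetwork call populates the cache; later calls reuse the compiled blob.
    core.SetConfig({{CONFIG_KEY(CACHE_DIR), "model_cache"}});
    auto network = core.ReadNetwork("model.xml");
    auto executable = core.LoadNetwork(network, "GPU");
    (void)executable;
    return 0;
}
```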
diff --git a/docs/IE_DG/ShapeInference.md b/docs/IE_DG/ShapeInference.md index dcc4b5c3f8837b..a265f2e9703e2e 100644 --- a/docs/IE_DG/ShapeInference.md +++ b/docs/IE_DG/ShapeInference.md @@ -33,7 +33,7 @@ If a model has a hard-coded batch dimension, use `InferenceEngine::CNNNetwork::s Inference Engine takes three kinds of a model description as an input, which are converted into an `InferenceEngine::CNNNetwork` object: 1. [Intermediate Representation (IR)](../MO_DG/IR_and_opsets.md) through `InferenceEngine::Core::ReadNetwork` -2. [ONNX model](../IE_DG/OnnxImporterTutorial.md) through `InferenceEngine::Core::ReadNetwork` +2. [ONNX model](../IE_DG/ONNX_Support.md) through `InferenceEngine::Core::ReadNetwork` 3. [nGraph function](../nGraph_DG/nGraph_dg.md) through the constructor of `InferenceEngine::CNNNetwork` `InferenceEngine::CNNNetwork` keeps an `ngraph::Function` object with the model description internally. diff --git a/docs/IE_DG/Tools_Overview.md b/docs/IE_DG/Tools_Overview.md index f0741105387617..e3acfa7fb483b7 100644 --- a/docs/IE_DG/Tools_Overview.md +++ b/docs/IE_DG/Tools_Overview.md @@ -6,11 +6,11 @@ The OpenVINO™ toolkit installation includes the following tools: |Tool | Location in the Installation Directory| |-----------------------------------------------------------------------------|---------------------------------------| -|[Accuracy Checker Tool](@ref omz_tools_accuracy_checker) | `/deployment_tools/tools/open_model_zoo/tools/accuracy_checker`| -|[Post-Training Optimization Tool](@ref pot_README) | `/deployment_tools/tools/post_training_optimization_toolkit`| -|[Model Downloader](@ref omz_tools_downloader) | `/deployment_tools/tools/model_downloader`| -|[Cross Check Tool](../../inference-engine/tools/cross_check_tool/README.md) | `/deployment_tools/tools/cross_check_tool`| -|[Compile Tool](../../inference-engine/tools/compile_tool/README.md) | `/deployment_tools/inference_engine/lib/intel64/`| +|[Accuracy Checker Tool](@ref omz_tools_accuracy_checker) | `/tools/accuracy_checker`| +|[Post-Training Optimization Tool](@ref pot_README) | `/tools/post_training_optimization_toolkit`| +|[Model Downloader](@ref omz_tools_downloader) | `/extras/open_model_zoo/tools/downloader`| +|[Cross Check Tool](../../tools/cross_check_tool/README.md) | `/tools/cross_check_tool`| +|[Compile Tool](../../tools/compile_tool/README.md) | `/tools/compile_tool`| ## See Also diff --git a/docs/IE_DG/inference_engine_intro.md b/docs/IE_DG/inference_engine_intro.md index 89d80654fe4480..3ad44b99144736 100644 --- a/docs/IE_DG/inference_engine_intro.md +++ b/docs/IE_DG/inference_engine_intro.md @@ -84,9 +84,9 @@ Make sure those libraries are in your computer's path or in the place you pointe * Windows: `PATH` * macOS: `DYLD_LIBRARY_PATH` -On Linux and macOS, use the script `bin/setupvars.sh` to set the environment variables. +On Linux and macOS, use the script `setupvars.sh` to set the environment variables. -On Windows, run the `bin\setupvars.bat` batch file to set the environment variables. +On Windows, run the `setupvars.bat` batch file to set the environment variables. To learn more about supported devices and corresponding plugins, see the [Supported Devices](supported_plugins/Supported_Devices.md) chapter. 
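As a companion to the `ShapeInference.md` passage above on the three accepted model descriptions, a minimal sketch is given below; the file names are placeholders and the trivial nGraph function exists only to keep the example self-contained:

```cpp
#include <inference_engine.hpp>
#include <ngraph/ngraph.hpp>
#include <ngraph/opsets/opset1.hpp>

int main() {
    InferenceEngine::Core core;

    // 1. Intermediate Representation: weights are taken from the .bin file next to the .xml
    InferenceEngine::CNNNetwork from_ir = core.ReadNetwork("model.xml");

    // 2. ONNX model read directly by the same call
    InferenceEngine::CNNNetwork from_onnx = core.ReadNetwork("model.onnx");

    // 3. nGraph function passed to the CNNNetwork constructor (a trivial Parameter->Relu graph)
    auto param = std::make_shared<ngraph::opset1::Parameter>(ngraph::element::f32, ngraph::Shape{1, 3, 224, 224});
    auto relu = std::make_shared<ngraph::opset1::Relu>(param);
    auto result = std::make_shared<ngraph::opset1::Result>(relu);
    auto function = std::make_shared<ngraph::Function>(ngraph::ResultVector{result}, ngraph::ParameterVector{param});
    InferenceEngine::CNNNetwork from_ngraph(function);

    (void)from_ir; (void)from_onnx; (void)from_ngraph;
    return 0;
}
```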
diff --git a/docs/IE_DG/supported_plugins/CPU.md b/docs/IE_DG/supported_plugins/CPU.md index 8f75a792adeeb2..12b005099ba092 100644 --- a/docs/IE_DG/supported_plugins/CPU.md +++ b/docs/IE_DG/supported_plugins/CPU.md @@ -105,17 +105,18 @@ These are general options, also supported by other plugins: | Parameter name | Parameter values | Default | Description | | :--- | :--- | :--- | :----------------------------------------------------------------------------------------------------------------------------| -| KEY_EXCLUSIVE_ASYNC_REQUESTS | YES/NO | NO | Forces async requests (also from different executable networks) to execute serially. This prevents potential oversubscription| -| KEY_PERF_COUNT | YES/NO | NO | Enables gathering performance counters | +| `KEY_EXCLUSIVE_ASYNC_REQUESTS` | `YES`/`NO` | `NO` | Forces async requests (also from different executable networks) to execute serially. This prevents potential oversubscription| +| `KEY_PERF_COUNT` | `YES`/`NO` | `NO` | Enables gathering performance counters | CPU-specific settings: -| Parameter name | Parameter values | Default | Description | -| :--- | :--- | :--- | :--- | -| KEY_CPU_THREADS_NUM | positive integer values| 0 | Specifies the number of threads that CPU plugin should use for inference. Zero (default) means using all (logical) cores| -| KEY_CPU_BIND_THREAD | YES/NUMA/NO | YES | Binds inference threads to CPU cores. 'YES' (default) binding option maps threads to cores - this works best for static/synthetic scenarios like benchmarks. The 'NUMA' binding is more relaxed, binding inference threads only to NUMA nodes, leaving further scheduling to specific cores to the OS. This option might perform better in the real-life/contended scenarios. Note that for the latency-oriented cases (number of the streams is less or equal to the number of NUMA nodes, see below) both YES and NUMA options limit number of inference threads to the number of hardware cores (ignoring hyper-threading) on the multi-socket machines. | -| KEY_CPU_THROUGHPUT_STREAMS | KEY_CPU_THROUGHPUT_NUMA, KEY_CPU_THROUGHPUT_AUTO, or positive integer values| 1 | Specifies number of CPU "execution" streams for the throughput mode. Upper bound for the number of inference requests that can be executed simultaneously. All available CPU cores are evenly distributed between the streams. The default value is 1, which implies latency-oriented behavior for single NUMA-node machine, with all available cores processing requests one by one. On the multi-socket (multiple NUMA nodes) machine, the best latency numbers usually achieved with a number of streams matching the number of NUMA-nodes.
KEY_CPU_THROUGHPUT_NUMA creates as many streams as needed to accommodate NUMA and avoid associated penalties.
KEY_CPU_THROUGHPUT_AUTO creates bare minimum of streams to improve the performance; this is the most portable option if you don't know how many cores your target machine has (and what would be the optimal number of streams). Note that your application should provide enough parallel slack (for example, run many inference requests) to leverage the throughput mode.
Non-negative integer value creates the requested number of streams. If a number of streams is 0, no internal streams are created and user threads are interpreted as stream master threads.| -| KEY_ENFORCE_BF16 | YES/NO| YES | The name for setting to execute in bfloat16 precision whenever it is possible. This option lets plugin know to downscale the precision where it sees performance benefits from bfloat16 execution. Such option does not guarantee accuracy of the network, you need to verify the accuracy in this mode separately, based on performance and accuracy results. It should be your decision whether to use this option or not. | + +| Parameter name | Parameter values | Default | Description | +| :--- | :--- | :--- |:-----------------------------------------------------------------------------| +| `KEY_CPU_THREADS_NUM` | `positive integer values`| `0` | Specifies the number of threads that CPU plugin should use for inference. Zero (default) means using all (logical) cores| +| `KEY_CPU_BIND_THREAD` | `YES`/`NUMA`/`NO` | `YES` | Binds inference threads to CPU cores. 'YES' (default) binding option maps threads to cores - this works best for static/synthetic scenarios like benchmarks. The 'NUMA' binding is more relaxed, binding inference threads only to NUMA nodes, leaving further scheduling to specific cores to the OS. This option might perform better in the real-life/contended scenarios. Note that for the latency-oriented cases (number of the streams is less or equal to the number of NUMA nodes, see below) both YES and NUMA options limit number of inference threads to the number of hardware cores (ignoring hyper-threading) on the multi-socket machines. | +| `KEY_CPU_THROUGHPUT_STREAMS` | `KEY_CPU_THROUGHPUT_NUMA`, `KEY_CPU_THROUGHPUT_AUTO`, or `positive integer values`| `1` | Specifies number of CPU "execution" streams for the throughput mode. Upper bound for the number of inference requests that can be executed simultaneously. All available CPU cores are evenly distributed between the streams. The default value is 1, which implies latency-oriented behavior for single NUMA-node machine, with all available cores processing requests one by one. On the multi-socket (multiple NUMA nodes) machine, the best latency numbers usually achieved with a number of streams matching the number of NUMA-nodes.
`KEY_CPU_THROUGHPUT_NUMA` creates as many streams as needed to accommodate NUMA and avoid associated penalties.
`KEY_CPU_THROUGHPUT_AUTO` creates the bare minimum of streams needed to improve performance; this is the most portable option if you don't know how many cores your target machine has (and what the optimal number of streams would be). Note that your application should provide enough parallel slack (for example, run many inference requests) to leverage the throughput mode.
Non-negative integer value creates the requested number of streams. If a number of streams is 0, no internal streams are created and user threads are interpreted as stream master threads.| +| `KEY_ENFORCE_BF16` | `YES`/`NO`| `YES` | The name for setting to execute in bfloat16 precision whenever it is possible. This option lets plugin know to downscale the precision where it sees performance benefits from bfloat16 execution. Such option does not guarantee accuracy of the network, you need to verify the accuracy in this mode separately, based on performance and accuracy results. It should be your decision whether to use this option or not. | > **NOTE**: To disable all internal threading, use the following set of configuration parameters: `KEY_CPU_THROUGHPUT_STREAMS=0`, `KEY_CPU_THREADS_NUM=1`, `KEY_CPU_BIND_THREAD=NO`. diff --git a/docs/IE_DG/supported_plugins/GPU.md b/docs/IE_DG/supported_plugins/GPU.md index cc12be98a121e1..ab84dfbac06a9f 100644 --- a/docs/IE_DG/supported_plugins/GPU.md +++ b/docs/IE_DG/supported_plugins/GPU.md @@ -99,23 +99,24 @@ The plugin supports the configuration parameters listed below. All parameters must be set before calling InferenceEngine::Core::LoadNetwork() in order to take effect. When specifying key values as raw strings (that is, when using Python API), omit the `KEY_` prefix. + | Parameter Name | Parameter Values | Default | Description | |---------------------|-----------------------------|-----------------|-----------------------------------------------------------| | `KEY_CACHE_DIR` | `""` | `""` | Specifies a directory where compiled OCL binaries can be cached. First model loading generates the cache, and all subsequent LoadNetwork calls use precompiled kernels which significantly improves load time. If empty - caching is disabled | | `KEY_PERF_COUNT` | `YES` / `NO` | `NO` | Collect performance counters during inference | | `KEY_CONFIG_FILE` | `" [ ...]"` | `""` | Load custom layer configuration files | -| `KEY_GPU_PLUGIN_PRIORITY` | `<0-3>` | `0` | OpenCL queue priority (before usage, make sure your OpenCL driver supports appropriate extension)
Higher value means higher priority for OpenCL queue. 0 disables the setting. | -| `KEY_GPU_PLUGIN_THROTTLE` | `<0-3>` | `0` | OpenCL queue throttling (before usage, make sure your OpenCL driver supports appropriate extension)
Lower value means lower driver thread priority and longer sleep time for it. 0 disables the setting. | -| `KEY_CLDNN_ENABLE_FP16_FOR_QUANTIZED_MODELS` | `YES` / `NO` | `YES` | Allows using FP16+INT8 mixed precision mode, so non-quantized parts of a model will be executed in FP16 precision for FP16 IR. Does not affect quantized FP32 IRs | -| `KEY_GPU_NV12_TWO_INPUTS` | `YES` / `NO` | `NO` | Controls preprocessing logic for nv12 input. If it's set to YES, then device graph will expect that user will set biplanar nv12 blob as input wich will be directly passed to device execution graph. Otherwise, preprocessing via GAPI is used to convert NV12->BGR, thus GPU graph have to expect single input | -| `KEY_GPU_THROUGHPUT_STREAMS` | `KEY_GPU_THROUGHPUT_AUTO`, or positive integer| 1 | Specifies a number of GPU "execution" streams for the throughput mode (upper bound for a number of inference requests that can be executed simultaneously).
This option is can be used to decrease GPU stall time by providing more effective load from several streams. Increasing the number of streams usually is more effective for smaller topologies or smaller input sizes. Note that your application should provide enough parallel slack (e.g. running many inference requests) to leverage full GPU bandwidth. Additional streams consume several times more GPU memory, so make sure the system has enough memory available to suit parallel stream execution. Multiple streams might also put additional load on CPU. If CPU load increases, it can be regulated by setting an appropriate `KEY_GPU_PLUGIN_THROTTLE` option value (see above). If your target system has relatively weak CPU, keep throttling low.
The default value is 1, which implies latency-oriented behavior.
`KEY_GPU_THROUGHPUT_AUTO` creates bare minimum of streams to improve the performance; this is the most portable option if you are not sure how many resources your target machine has (and what would be the optimal number of streams).
A positive integer value creates the requested number of streams. | -| `KEY_EXCLUSIVE_ASYNC_REQUESTS` | `YES` / `NO` | `NO` | Forces async requests (also from different executable networks) to execute serially.| -| `KEY_GPU_MAX_NUM_THREADS` | `integer value` | `maximum # of HW threads available in host environment` | Specifies the number of CPU threads that can be used for GPU engine, e.g, JIT compilation of GPU kernels or cpu kernel processing within GPU plugin. The default value is set as the number of maximum available threads in host environment to minimize the time for LoadNetwork, where the GPU kernel build time occupies a large portion. Note that if the specified value is larger than the maximum available # of threads or less than zero, it is set as maximum available # of threads. It can be specified with a smaller number than the available HW threads according to the usage scenario, e.g., when the user wants to assign more CPU threads while GPU plugin is running. Note that setting this value with lower number will affect not only the network loading time but also the cpu layers of GPU networks that are optimized with multi-threading. | -| `KEY_GPU_ENABLE_LOOP_UNROLLING` | `YES` / `NO` | `YES` | Enables recurrent layers such as TensorIterator or Loop with fixed iteration count to be unrolled. It is turned on by default. Turning this key on will achieve better inference performance for loops with not too many iteration counts (less than 16, as a rule of thumb). Turning this key off will achieve better performance for both graph loading time and inference time with many iteration counts (greater than 16). Note that turning this key on will increase the graph loading time in proportion to the iteration counts. Thus, this key should be turned off if graph loading time is considered to be most important target to optimize. | -| `KEY_CLDNN_PLUGIN_PRIORITY` | `<0-3>` | `0` | OpenCL queue priority (before usage, make sure your OpenCL driver supports appropriate extension)
Higher value means higher priority for OpenCL queue. 0 disables the setting. **Deprecated**. Please use KEY_GPU_PLUGIN_PRIORITY | -| `KEY_CLDNN_PLUGIN_THROTTLE` | `<0-3>` | `0` | OpenCL queue throttling (before usage, make sure your OpenCL driver supports appropriate extension)
Lower value means lower driver thread priority and longer sleep time for it. 0 disables the setting. **Deprecated**. Please use KEY_GPU_PLUGIN_THROTTLE | -| `KEY_CLDNN_GRAPH_DUMPS_DIR` | `""` | `""` | clDNN graph optimizer stages dump output directory (in GraphViz format) **Deprecated**. Will be removed in the next release | -| `KEY_CLDNN_SOURCES_DUMPS_DIR` | `""` | `""` | Final optimized clDNN OpenCL sources dump output directory. **Deprecated**. Will be removed in the next release | +| `KEY_GPU_PLUGIN_`
`PRIORITY` | `<0-3>` | `0` | OpenCL queue priority (before usage, make sure your OpenCL driver supports appropriate extension)
Higher value means higher priority for OpenCL queue. 0 disables the setting. | +| `KEY_GPU_PLUGIN_`
`THROTTLE` | `<0-3>` | `0` | OpenCL queue throttling (before usage, make sure your OpenCL driver supports appropriate extension)
Lower value means lower driver thread priority and longer sleep time for it. 0 disables the setting. | +| `KEY_CLDNN_ENABLE_`
`FP16_FOR_QUANTIZED_`
`MODELS` | `YES` / `NO` | `YES` | Allows using FP16+INT8 mixed precision mode, so non-quantized parts of a model will be executed in FP16 precision for FP16 IR. Does not affect quantized FP32 IRs | +| `KEY_GPU_NV12_`
`TWO_INPUTS` | `YES` / `NO` | `NO` | Controls preprocessing logic for nv12 input. If it's set to YES, then the device graph will expect that the user will set a biplanar nv12 blob as input which will be directly passed to the device execution graph. Otherwise, preprocessing via GAPI is used to convert NV12->BGR, thus the GPU graph has to expect a single input | +| `KEY_GPU_THROUGHPUT_`
`STREAMS` | `KEY_GPU_THROUGHPUT_AUTO`, or positive integer| 1 | Specifies a number of GPU "execution" streams for the throughput mode (upper bound for a number of inference requests that can be executed simultaneously).
This option can be used to decrease GPU stall time by providing a more effective load from several streams. Increasing the number of streams is usually more effective for smaller topologies or smaller input sizes. Note that your application should provide enough parallel slack (e.g. running many inference requests) to leverage full GPU bandwidth. Additional streams consume several times more GPU memory, so make sure the system has enough memory available to suit parallel stream execution. Multiple streams might also put additional load on the CPU. If CPU load increases, it can be regulated by setting an appropriate `KEY_GPU_PLUGIN_THROTTLE` option value (see above). If your target system has a relatively weak CPU, keep throttling low.
The default value is 1, which implies latency-oriented behavior.
`KEY_GPU_THROUGHPUT_AUTO` creates the bare minimum of streams needed to improve performance; this is the most portable option if you are not sure how many resources your target machine has (and what the optimal number of streams would be).
A positive integer value creates the requested number of streams. | +| `KEY_EXCLUSIVE_ASYNC_`
`REQUESTS` | `YES` / `NO` | `NO` | Forces async requests (also from different executable networks) to execute serially.| +| `KEY_GPU_MAX_NUM_`
`THREADS` | `integer value` | `maximum # of HW threads available in host environment` | Specifies the number of CPU threads that can be used for the GPU engine, e.g., JIT compilation of GPU kernels or CPU kernel processing within the GPU plugin. The default value is set as the number of maximum available threads in the host environment to minimize the time for LoadNetwork, where the GPU kernel build time occupies a large portion. Note that if the specified value is larger than the maximum available # of threads or less than zero, it is set as the maximum available # of threads. It can be specified with a smaller number than the available HW threads according to the usage scenario, e.g., when the user wants to assign more CPU threads while the GPU plugin is running. Note that setting this value to a lower number will affect not only the network loading time but also the CPU layers of GPU networks that are optimized with multi-threading. | +| `KEY_GPU_ENABLE_`
`LOOP_UNROLLING` | `YES` / `NO` | `YES` | Enables recurrent layers such as TensorIterator or Loop with fixed iteration count to be unrolled. It is turned on by default. Turning this key on will achieve better inference performance for loops with not too many iteration counts (less than 16, as a rule of thumb). Turning this key off will achieve better performance for both graph loading time and inference time with many iteration counts (greater than 16). Note that turning this key on will increase the graph loading time in proportion to the iteration counts. Thus, this key should be turned off if graph loading time is considered to be most important target to optimize. | +| `KEY_CLDNN_PLUGIN_`
`PRIORITY` | `<0-3>` | `0` | OpenCL queue priority (before usage, make sure your OpenCL driver supports appropriate extension)
Higher value means higher priority for OpenCL queue. 0 disables the setting. **Deprecated**. Please use KEY_GPU_PLUGIN_PRIORITY | +| `KEY_CLDNN_PLUGIN_`
`THROTTLE` | `<0-3>` | `0` | OpenCL queue throttling (before usage, make sure your OpenCL driver supports appropriate extension)
Lower value means lower driver thread priority and longer sleep time for it. 0 disables the setting. **Deprecated**. Please use KEY_GPU_PLUGIN_THROTTLE | +| `KEY_CLDNN_GRAPH_`
`DUMPS_DIR` | `""` | `""` | clDNN graph optimizer stages dump output directory (in GraphViz format) **Deprecated**. Will be removed in the next release | +| `KEY_CLDNN_SOURCES_`
`DUMPS_DIR` | `""` | `""` | Final optimized clDNN OpenCL sources dump output directory. **Deprecated**. Will be removed in the next release | | `KEY_DUMP_KERNELS` | `YES` / `NO` | `NO` | Dump the final kernels used for custom layers. **Deprecated**. Will be removed in the next release | | `KEY_TUNING_MODE` | `TUNING_DISABLED`
`TUNING_CREATE`
`TUNING_USE_EXISTING` | `TUNING_DISABLED` | Disable inference kernel tuning
Create tuning file (expect much longer runtime)
Use an existing tuning file. **Deprecated**. Will be removed in the next release | | `KEY_TUNING_FILE` | `""` | `""` | Tuning file to create / use. **Deprecated**. Will be removed in the next release | diff --git a/docs/IE_DG/supported_plugins/HETERO.md b/docs/IE_DG/supported_plugins/HETERO.md index f2b7521457e294..3d965e109f24e7 100644 --- a/docs/IE_DG/supported_plugins/HETERO.md +++ b/docs/IE_DG/supported_plugins/HETERO.md @@ -23,7 +23,7 @@ If transmitting data from one part of a network to another part in heterogeneous In this case, you can define heaviest part manually and set the affinity to avoid sending data back and forth many times during one inference. ## Annotation of Layers per Device and Default Fallback Policy -Default fallback policy decides which layer goes to which device automatically according to the support in dedicated plugins (FPGA, GPU, CPU, MYRIAD). +Default fallback policy decides which layer goes to which device automatically according to the support in dedicated plugins (GPU, CPU, MYRIAD). Another way to annotate a network is to set affinity manually using ngraph::Node::get_rt_info with key `"affinity"`: @@ -46,25 +46,16 @@ If you rely on the default affinity distribution, you can avoid calling In During loading of the network to heterogeneous plugin, network is divided to separate parts and loaded to dedicated plugins. Intermediate blobs between these sub graphs are allocated automatically in the most efficient way. -## Execution Precision -Precision for inference in heterogeneous plugin is defined by -* Precision of IR. -* Ability of final plugins to execute in precision defined in IR - -Examples: -* If you want to execute GPU with CPU fallback with FP16 on GPU, you need to use only FP16 IR. -* If you want to execute on FPGA with CPU fallback, you can use any precision for IR. The execution on FPGA is defined by bitstream, the execution on CPU happens in FP32. - Samples can be used with the following command: ```sh -./object_detection_sample_ssd -m /ModelSSD.xml -i /picture.jpg -d HETERO:FPGA,CPU +./object_detection_sample_ssd -m /ModelSSD.xml -i /picture.jpg -d HETERO:GPU,CPU ``` where: - `HETERO` stands for heterogeneous plugin -- `FPGA,CPU` points to fallback policy with priority on FPGA and fallback to CPU +- `GPU,CPU` points to fallback policy with priority on GPU and fallback to CPU -You can point more than two devices: `-d HETERO:FPGA,GPU,CPU` +You can point more than two devices: `-d HETERO:GPU,GPU,CPU` ## Analyzing Heterogeneous Execution After enabling of KEY_HETERO_DUMP_GRAPH_DOT config key, you can dump GraphViz* `.dot` files with annotations of devices per layer. diff --git a/docs/IE_DG/supported_plugins/MULTI.md b/docs/IE_DG/supported_plugins/MULTI.md index a3f7dc2afc9a89..cebc03ba135fdc 100644 --- a/docs/IE_DG/supported_plugins/MULTI.md +++ b/docs/IE_DG/supported_plugins/MULTI.md @@ -96,10 +96,8 @@ Notice that you can use the FP16 IR to work with multi-device (as CPU automatica Also notice that no demos are (yet) fully optimized for the multi-device, by means of supporting the OPTIMAL_NUMBER_OF_INFER_REQUESTS metric, using the GPU streams/throttling, and so on. 
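Referring back to the `HETERO.md` and `MULTI.md` passages above, the device-priority strings can also be used directly from the C++ API; a short sketch, assuming a GPU and a CPU are available and using a placeholder model path:

```cpp
#include <inference_engine.hpp>
#include <ie_plugin_config.hpp>

int main() {
    InferenceEngine::Core core;
    auto network = core.ReadNetwork("model.xml");

    // Heterogeneous execution: GPU is tried first, unsupported layers fall back to CPU.
    auto hetero_exec = core.LoadNetwork(network, "HETERO:GPU,CPU");

    // Multi-device execution over the same two devices.
    auto multi_exec = core.LoadNetwork(network, "MULTI:GPU,CPU");

    // Query how many infer requests the multi-device configuration can keep busy,
    // as mentioned in the MULTI notes above.
    auto nireq = multi_exec.GetMetric(METRIC_KEY(OPTIMAL_NUMBER_OF_INFER_REQUESTS)).as<unsigned int>();
    (void)hetero_exec; (void)nireq;
    return 0;
}
```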
## Video: MULTI Plugin -[![](https://img.youtube.com/vi/xbORYFEmrqU/0.jpg)](https://www.youtube.com/watch?v=xbORYFEmrqU) -\htmlonly + -\endhtmlonly ## See Also * [Supported Devices](Supported_Devices.md) diff --git a/docs/Legal_Information.md b/docs/Legal_Information.md index 2f3526f2902677..2936ae2a949665 100644 --- a/docs/Legal_Information.md +++ b/docs/Legal_Information.md @@ -1,22 +1,20 @@ # Legal Information {#openvino_docs_Legal_Information} -This software and the related documents are Intel copyrighted materials, and your use of them is governed by the express license (the “License”) under which they were provided to you. No license (express or implied, by estoppel or otherwise) to any intellectual property rights is granted by this document. Unless the License provides otherwise, you may not use, modify, copy, publish, distribute, disclose or transmit this software or the related documents without Intel's prior written permission. This software and the related documents are provided as is, with no express or implied warranties, other than those that are expressly stated in the License. Intel disclaims all express and implied warranties, including without limitation, the implied warranties of merchantability, fitness for a particular purpose, and non-infringement, as well as any warranty arising from course of performance, course of dealing, or usage in trade. - -This document contains information on products, services and/or processes in development. All information provided here is subject to change without notice. Contact your Intel representative to obtain the latest forecast, schedule, specifications and roadmaps. The products and services described may contain defects or errors known as errata which may cause deviations from published specifications. Current characterized errata are available on request. Copies of documents which have an order number and are referenced in this document may be obtained by calling 1-800-548-4725 or by visiting [www.intel.com/design/literature.htm](https://www.intel.com/design/literature.htm). - Performance varies by use, configuration and other factors. Learn more at [www.intel.com/PerformanceIndex](https://www.intel.com/PerformanceIndex). - -Performance results are based on testing as of dates shown in configurations and may not reflect all publicly available updates. See backup for configuration details. No product or component can be absolutely secure. - -Your costs and results may vary. - + +Performance results are based on testing as of dates shown in configurations and may not reflect all publicly available updates. See backup for configuration details. No product or component can be absolutely secure. + +Your costs and results may vary. + Intel technologies may require enabled hardware, software or service activation. -© Intel Corporation. Intel, the Intel logo, and other Intel marks are trademarks of Intel Corporation or its subsidiaries. \*Other names and brands may be claimed as the property of others. +OpenCL and the OpenCL logo are trademarks of Apple Inc. used by permission by Khronos. +© Intel Corporation. Intel, the Intel logo, and other Intel marks are trademarks of Intel Corporation or its subsidiaries. Other names and brands may be claimed as the property of others. + ## OpenVINO™ Logo To build equity around the project, the OpenVINO logo was created for both Intel and community usage. The logo may only be used to represent the OpenVINO toolkit and offerings built using the OpenVINO toolkit. 
- + ## Logo Usage Guidelines The OpenVINO logo must be used in connection with truthful, non-misleading references to the OpenVINO toolkit, and for no other purpose. -Modification of the logo or use of any separate element(s) of the logo alone is not allowed. +Modification of the logo or use of any separate element(s) of the logo alone is not allowed. \ No newline at end of file diff --git a/docs/MO_DG/Deep_Learning_Model_Optimizer_DevGuide.md b/docs/MO_DG/Deep_Learning_Model_Optimizer_DevGuide.md index 2aed66ba719934..378d559f895805 100644 --- a/docs/MO_DG/Deep_Learning_Model_Optimizer_DevGuide.md +++ b/docs/MO_DG/Deep_Learning_Model_Optimizer_DevGuide.md @@ -1,136 +1,54 @@ # Model Optimizer Developer Guide {#openvino_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide} +## Introduction + Model Optimizer is a cross-platform command-line tool that facilitates the transition between the training and deployment environment, performs static model analysis, and adjusts deep learning models for optimal execution on end-point target devices. -Model Optimizer process assumes you have a network model trained using a supported deep learning framework. The scheme below illustrates the typical workflow for deploying a trained deep learning model: +Model Optimizer process assumes you have a network model trained using supported deep learning frameworks: Caffe*, TensorFlow*, Kaldi*, MXNet* or converted to the ONNX* format. Model Optimizer produces an Intermediate Representation (IR) of the network, which can be inferred with the [Inference Engine](../IE_DG/Deep_Learning_Inference_Engine_DevGuide.md). + +> **NOTE**: Model Optimizer does not infer models. Model Optimizer is an offline tool that runs before the inference takes place. + +The scheme below illustrates the typical workflow for deploying a trained deep learning model: ![](img/workflow_steps.png) -Model Optimizer produces an Intermediate Representation (IR) of the network, which can be read, loaded, and inferred with the Inference Engine. The Inference Engine API offers a unified API across a number of supported Intel® platforms. The Intermediate Representation is a pair of files describing the model: +The IR is a pair of files describing the model: * .xml - Describes the network topology * .bin - Contains the weights and biases binary data. -> **TIP**: You also can work with the Model Optimizer inside the OpenVINO™ [Deep Learning Workbench](@ref workbench_docs_Workbench_DG_Introduction) (DL Workbench). -> [DL Workbench](@ref workbench_docs_Workbench_DG_Introduction) is a platform built upon OpenVINO™ and provides a web-based graphical environment that enables you to optimize, fine-tune, analyze, visualize, and compare -> performance of deep learning models on various Intel® architecture -> configurations. In the DL Workbench, you can use most of OpenVINO™ toolkit components. ->
-> Proceed to an [easy installation from Docker](@ref workbench_docs_Workbench_DG_Install_from_Docker_Hub) to get started. - -## What's New in the Model Optimizer in this Release? - -* Common changes: - * Implemented several optimization transformations to replace sub-graphs of operations with HSwish, Mish, Swish and SoftPlus operations. - * Model Optimizer generates IR keeping shape-calculating sub-graphs **by default**. Previously, this behavior was triggered if the "--keep_shape_ops" command line parameter was provided. The key is ignored in this release and will be deleted in the next release. To trigger the legacy behavior to generate an IR for a fixed input shape (folding ShapeOf operations and shape-calculating sub-graphs to Constant), use the "--static_shape" command line parameter. Changing model input shape using the Inference Engine API in runtime may fail for such an IR. - * Fixed Model Optimizer conversion issues resulted in non-reshapeable IR using the Inference Engine reshape API. - * Enabled transformations to fix non-reshapeable patterns in the original networks: - * Hardcoded Reshape - * In Reshape(2D)->MatMul pattern - * Reshape->Transpose->Reshape when the pattern can be fused to the ShuffleChannels or DepthToSpace operation - * Hardcoded Interpolate - * In Interpolate->Concat pattern - * Added a dedicated requirements file for TensorFlow 2.X as well as the dedicated install prerequisites scripts. - * Replaced the SparseToDense operation with ScatterNDUpdate-4. -* ONNX*: - * Enabled an ability to specify the model output **tensor** name using the "--output" command line parameter. - * Added support for the following operations: - * Acosh - * Asinh - * Atanh - * DepthToSpace-11, 13 - * DequantizeLinear-10 (zero_point must be constant) - * HardSigmoid-1,6 - * QuantizeLinear-10 (zero_point must be constant) - * ReduceL1-11, 13 - * ReduceL2-11, 13 - * Resize-11, 13 (except mode="nearest" with 5D+ input, mode="tf_crop_and_resize", and attributes exclude_outside and extrapolation_value with non-zero values) - * ScatterND-11, 13 - * SpaceToDepth-11, 13 -* TensorFlow*: - * Added support for the following operations: - * Acosh - * Asinh - * Atanh - * CTCLoss - * EuclideanNorm - * ExtractImagePatches - * FloorDiv -* MXNet*: - * Added support for the following operations: - * Acosh - * Asinh - * Atanh -* Kaldi*: - * Fixed bug with ParallelComponent support. Now it is fully supported with no restrictions. - -> **NOTE:** -> [Intel® System Studio](https://software.intel.com/en-us/system-studio) is an all-in-one, cross-platform tool suite, purpose-built to simplify system bring-up and improve system and IoT device application performance on Intel® platforms. If you are using the Intel® Distribution of OpenVINO™ with Intel® System Studio, go to [Get Started with Intel® System Studio](https://software.intel.com/en-us/articles/get-started-with-openvino-and-intel-system-studio-2019). 
- -## Table of Contents - -* [Preparing and Optimizing your Trained Model with Model Optimizer](prepare_model/Prepare_Trained_Model.md) - * [Configuring Model Optimizer](prepare_model/Config_Model_Optimizer.md) - * [Converting a Model to Intermediate Representation (IR)](prepare_model/convert_model/Converting_Model.md) - * [Converting a Model Using General Conversion Parameters](prepare_model/convert_model/Converting_Model_General.md) - * [Converting Your Caffe* Model](prepare_model/convert_model/Convert_Model_From_Caffe.md) - * [Converting Your TensorFlow* Model](prepare_model/convert_model/Convert_Model_From_TensorFlow.md) - * [Converting BERT from TensorFlow](prepare_model/convert_model/tf_specific/Convert_BERT_From_Tensorflow.md) - * [Converting GNMT from TensorFlow](prepare_model/convert_model/tf_specific/Convert_GNMT_From_Tensorflow.md) - * [Converting YOLO from DarkNet to TensorFlow and then to IR](prepare_model/convert_model/tf_specific/Convert_YOLO_From_Tensorflow.md) - * [Converting Wide and Deep Models from TensorFlow](prepare_model/convert_model/tf_specific/Convert_WideAndDeep_Family_Models.md) - * [Converting FaceNet from TensorFlow](prepare_model/convert_model/tf_specific/Convert_FaceNet_From_Tensorflow.md) - * [Converting DeepSpeech from TensorFlow](prepare_model/convert_model/tf_specific/Convert_DeepSpeech_From_Tensorflow.md) - * [Converting Language Model on One Billion Word Benchmark from TensorFlow](prepare_model/convert_model/tf_specific/Convert_lm_1b_From_Tensorflow.md) - * [Converting Neural Collaborative Filtering Model from TensorFlow*](prepare_model/convert_model/tf_specific/Convert_NCF_From_Tensorflow.md) - * [Converting TensorFlow* Object Detection API Models](prepare_model/convert_model/tf_specific/Convert_Object_Detection_API_Models.md) - * [Converting TensorFlow*-Slim Image Classification Model Library Models](prepare_model/convert_model/tf_specific/Convert_Slim_Library_Models.md) - * [Converting CRNN Model from TensorFlow*](prepare_model/convert_model/tf_specific/Convert_CRNN_From_Tensorflow.md) - * [Converting Your MXNet* Model](prepare_model/convert_model/Convert_Model_From_MxNet.md) - * [Converting a Style Transfer Model from MXNet](prepare_model/convert_model/mxnet_specific/Convert_Style_Transfer_From_MXNet.md) - * [Converting Your Kaldi* Model](prepare_model/convert_model/Convert_Model_From_Kaldi.md) - * [Converting Your ONNX* Model](prepare_model/convert_model/Convert_Model_From_ONNX.md) - * [Converting Faster-RCNN ONNX* Model](prepare_model/convert_model/onnx_specific/Convert_Faster_RCNN.md) - * [Converting Mask-RCNN ONNX* Model](prepare_model/convert_model/onnx_specific/Convert_Mask_RCNN.md) - * [Converting GPT2 ONNX* Model](prepare_model/convert_model/onnx_specific/Convert_GPT2.md) - * [Converting Your PyTorch* Model](prepare_model/convert_model/Convert_Model_From_PyTorch.md) - * [Converting F3Net PyTorch* Model](prepare_model/convert_model/pytorch_specific/Convert_F3Net.md) - * [Converting QuartzNet PyTorch* Model](prepare_model/convert_model/pytorch_specific/Convert_QuartzNet.md) - * [Converting YOLACT PyTorch* Model](prepare_model/convert_model/pytorch_specific/Convert_YOLACT.md) - * [Model Optimizations Techniques](prepare_model/Model_Optimization_Techniques.md) - * [Cutting parts of the model](prepare_model/convert_model/Cutting_Model.md) - * [Sub-graph Replacement in Model Optimizer](prepare_model/customize_model_optimizer/Subgraph_Replacement_Model_Optimizer.md) - * [Supported Framework Layers](prepare_model/Supported_Frameworks_Layers.md) - * 
[Intermediate Representation and Operation Sets](IR_and_opsets.md) - * [Operations Specification](../ops/opset.md) - * [Intermediate Representation suitable for INT8 inference](prepare_model/convert_model/IR_suitable_for_INT8_inference.md) - * [Model Optimizer Extensibility](prepare_model/customize_model_optimizer/Customize_Model_Optimizer.md) - * [Extending Model Optimizer with New Primitives](prepare_model/customize_model_optimizer/Extending_Model_Optimizer_with_New_Primitives.md) - * [Extending Model Optimizer with Caffe Python Layers](prepare_model/customize_model_optimizer/Extending_Model_Optimizer_with_Caffe_Python_Layers.md) - * [Extending Model Optimizer with Custom MXNet* Operations](prepare_model/customize_model_optimizer/Extending_MXNet_Model_Optimizer_with_New_Primitives.md) - * [Legacy Mode for Caffe* Custom Layers](prepare_model/customize_model_optimizer/Legacy_Mode_for_Caffe_Custom_Layers.md) - * [Model Optimizer Frequently Asked Questions](prepare_model/Model_Optimizer_FAQ.md) - -* [Known Issues](Known_Issues_Limitations.md) - -**Typical Next Step:** [Preparing and Optimizing your Trained Model with Model Optimizer](prepare_model/Prepare_Trained_Model.md) - -## Video: Model Optimizer Concept - -[![](https://img.youtube.com/vi/Kl1ptVb7aI8/0.jpg)](https://www.youtube.com/watch?v=Kl1ptVb7aI8) -\htmlonly - -\endhtmlonly - -## Video: Model Optimizer Basic Operation -[![](https://img.youtube.com/vi/BBt1rseDcy0/0.jpg)](https://www.youtube.com/watch?v=BBt1rseDcy0) -\htmlonly - -\endhtmlonly +Below is a simple command running Model Optimizer to generate an IR for the input model: + +```sh +python3 mo.py --input_model INPUT_MODEL +``` +To learn about all Model Optimizer parameters and conversion technics, see the [Converting a Model to IR](prepare_model/convert_model/Converting_Model.md) page. + +> **TIP**: You can quick start with the Model Optimizer inside the OpenVINO™ [Deep Learning Workbench](@ref +> openvino_docs_get_started_get_started_dl_workbench) (DL Workbench). +> [DL Workbench](@ref workbench_docs_Workbench_DG_Introduction) is the OpenVINO™ toolkit UI that enables you to +> import a model, analyze its performance and accuracy, visualize the outputs, optimize and prepare the model for +> deployment on various Intel® platforms. + +## Videos + + + + + + + + + + + + +
+[Embedded video table: "Model Optimizer Concept" (Duration: 3:56), "Model Optimizer Basic Operation" (Duration: 2:57), "Choosing the Right Precision" (Duration: 4:18)]
-## Video: Choosing the Right Precision -[![](https://img.youtube.com/vi/RF8ypHyiKrY/0.jpg)](https://www.youtube.com/watch?v=RF8ypHyiKrY) -\htmlonly - -\endhtmlonly diff --git a/docs/MO_DG/img/small_IR_graph_demonstration.png b/docs/MO_DG/img/small_IR_graph_demonstration.png index 91a3fe385ae32f..332c11fdb65b66 100644 --- a/docs/MO_DG/img/small_IR_graph_demonstration.png +++ b/docs/MO_DG/img/small_IR_graph_demonstration.png @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c8ae479880ab43cdb12eeb2fbaaf3b7861f786413c583eeba906c5fdf4b66730 -size 30696 +oid sha256:e8a86ea362473121a266c0ec1257c8d428a4bb6438fecdc9d4a4f1ff5cfc9047 +size 26220 diff --git a/docs/MO_DG/img/workflow_steps.png b/docs/MO_DG/img/workflow_steps.png index 6bf780127ad14c..fee04b7cb33ebe 100644 --- a/docs/MO_DG/img/workflow_steps.png +++ b/docs/MO_DG/img/workflow_steps.png @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5e22bc22d614c7335ae461a8ce449ea8695973d755faca718cf74b95972c94e2 -size 19773 +oid sha256:5281f26cbaa468dc4cafa4ce2fde35d338fe0f658bbb796abaaf793e951939f6 +size 13943 diff --git a/docs/MO_DG/prepare_model/Config_Model_Optimizer.md b/docs/MO_DG/prepare_model/Config_Model_Optimizer.md index 9b978d750aa586..186b8ddabd5b4e 100644 --- a/docs/MO_DG/prepare_model/Config_Model_Optimizer.md +++ b/docs/MO_DG/prepare_model/Config_Model_Optimizer.md @@ -1,8 +1,6 @@ -# Configuring the Model Optimizer {#openvino_docs_MO_DG_prepare_model_Config_Model_Optimizer} +# Installing Model Optimizer Pre-Requisites {#openvino_docs_MO_DG_prepare_model_Config_Model_Optimizer} -You must configure the Model Optimizer for the framework that was used to train -the model. This section tells you how to configure the Model Optimizer either -through scripts or by using a manual process. +Before running the Model Optimizer, you must install the Model Optimizer pre-requisites for the framework that was used to train the model. This section tells you how to install the pre-requisites either through scripts or by using a manual process. ## Using Configuration Scripts @@ -12,7 +10,7 @@ dependencies and provide the fastest and easiest way to configure the Model Optimizer. To configure all three frameworks, go to the -`/deployment_tools/model_optimizer/install_prerequisites` +`/tools/model_optimizer/install_prerequisites` directory and run: * For Linux\* OS: @@ -37,7 +35,7 @@ install_prerequisites.bat ``` To configure a specific framework, go to the -`/deployment_tools/model_optimizer/install_prerequisites` +`/tools/model_optimizer/install_prerequisites` directory and run: * For Caffe\* on Linux: @@ -103,7 +101,7 @@ framework at a time. 1. Go to the Model Optimizer directory: ```shell -cd /deployment_tools/model_optimizer/ +cd /tools/model_optimizer/ ``` 2. **Strongly recommended for all global Model Optimizer dependency installations**: Create and activate a virtual environment. While not required, this step is @@ -154,6 +152,10 @@ pip3 install -r requirements_onnx.txt ``` ## Using the protobuf Library in the Model Optimizer for Caffe\* +
+ Click to expand + + These procedures require: @@ -166,7 +168,7 @@ By default, the library executes pure Python\* language implementation, which is slow. These steps show how to use the faster C++ implementation of the protobuf library on Windows OS or Linux OS. -### Using the protobuf Library on Linux\* OS +#### Using the protobuf Library on Linux\* OS To use the C++ implementation of the protobuf library on Linux, it is enough to set up the environment variable: @@ -174,12 +176,12 @@ set up the environment variable: export PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=cpp ``` -### Using the protobuf Library on Windows\* OS +#### Using the protobuf Library on Windows\* OS On Windows, pre-built protobuf packages for Python versions 3.4, 3.5, 3.6, and 3.7 are provided with the installation package and can be found in the -`\deployment_tools\model_optimizer\install_prerequisites` +`\tools\model_optimizer\install_prerequisites` folder. Please note that they are not installed with the `install_prerequisites.bat` installation script due to possible issues with `pip`, and you can install them at your own discretion. Make sure @@ -196,7 +198,7 @@ To install the protobuf package: 1. Open the command prompt as administrator. 2. Go to the `install_prerequisites` folder of the OpenVINO toolkit installation directory: ```sh -cd \deployment_tools\model_optimizer\install_prerequisites +cd \tools\model_optimizer\install_prerequisites ``` 3. Run the following command to install the protobuf for Python 3.6. If @@ -262,6 +264,8 @@ python3 -m easy_install dist/protobuf-3.6.1-py3.6-win-amd64.egg set PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=cpp ``` +
+ ## See Also * [Converting a Model to Intermediate Representation (IR)](convert_model/Converting_Model.md) diff --git a/docs/MO_DG/prepare_model/Model_Optimizer_FAQ.md b/docs/MO_DG/prepare_model/Model_Optimizer_FAQ.md index bb599cf93b5632..cd41e9da21d0a8 100644 --- a/docs/MO_DG/prepare_model/Model_Optimizer_FAQ.md +++ b/docs/MO_DG/prepare_model/Model_Optimizer_FAQ.md @@ -28,7 +28,7 @@ For example, to add the description of the `CustomReshape` layer, which is an ar 2. Generate a new parser: ```shell -cd /deployment_tools/model_optimizer/mo/front/caffe/proto +cd /tools/model_optimizer/mo/front/caffe/proto python3 generate_caffe_pb2.py --input_proto /src/caffe/proto/caffe.proto ``` where `PATH_TO_CUSTOM_CAFFE` is the path to the root directory of custom Caffe\*. @@ -66,7 +66,7 @@ The mean file that you provide for the Model Optimizer must be in a `.binaryprot #### 7. What does the message "Invalid proto file: there is neither 'layer' nor 'layers' top-level messages" mean? -The structure of any Caffe\* topology is described in the `caffe.proto` file of any Caffe version. For example, in the Model Optimizer, you can find the following proto file, used by default: `/deployment_tools/model_optimizer/mo/front/caffe/proto/my_caffe.proto`. There you can find the structure: +The structure of any Caffe\* topology is described in the `caffe.proto` file of any Caffe version. For example, in the Model Optimizer, you can find the following proto file, used by default: `/tools/model_optimizer/mo/front/caffe/proto/my_caffe.proto`. There you can find the structure: ``` message NetParameter { // ... some other parameters @@ -81,7 +81,7 @@ This means that any topology should contain layers as top-level structures in `p #### 8. What does the message "Old-style inputs (via 'input_dims') are not supported. Please specify inputs via 'input_shape'" mean? -The structure of any Caffe\* topology is described in the `caffe.proto` file for any Caffe version. For example, in the Model Optimizer you can find the following `.proto` file, used by default: `/deployment_tools/model_optimizer/mo/front/caffe/proto/my_caffe.proto`. There you can find the structure: +The structure of any Caffe\* topology is described in the `caffe.proto` file for any Caffe version. For example, in the Model Optimizer you can find the following `.proto` file, used by default: `/tools/model_optimizer/mo/front/caffe/proto/my_caffe.proto`. There you can find the structure: ```sh message NetParameter { diff --git a/docs/MO_DG/prepare_model/Prepare_Trained_Model.md b/docs/MO_DG/prepare_model/Prepare_Trained_Model.md deleted file mode 100644 index a74d1b789a2f34..00000000000000 --- a/docs/MO_DG/prepare_model/Prepare_Trained_Model.md +++ /dev/null @@ -1,63 +0,0 @@ -# Preparing and Optimizing Your Trained Model {#openvino_docs_MO_DG_prepare_model_Prepare_Trained_Model} - -Inference Engine enables _deploying_ your network model trained with any of supported deep learning frameworks: Caffe\*, TensorFlow\*, Kaldi\*, MXNet\* or converted to the ONNX\* format. To perform the inference, the Inference Engine does not operate with the original model, but with its Intermediate Representation (IR), which is optimized for execution on end-point target devices. To generate an IR for your trained model, the Model Optimizer tool is used. - -## How the Model Optimizer Works - -Model Optimizer loads a model into memory, reads it, builds the internal representation of the model, optimizes it, and produces the Intermediate Representation. 
Intermediate Representation is the only format the Inference Engine accepts. - -> **NOTE**: Model Optimizer does not infer models. Model Optimizer is an offline tool that runs before the inference takes place. - -Model Optimizer has two main purposes: - -* **Produce a valid Intermediate Representation**. If this main conversion artifact is not valid, the Inference Engine cannot run. The primary responsibility of the Model Optimizer is to produce the two files (`.xml` and `.bin`) that form the Intermediate Representation. -* **Produce an optimized Intermediate Representation**. Pre-trained models contain layers that are important for training, such as the `Dropout` layer. These layers are useless during inference and might increase the inference time. In many cases, these operations can be automatically removed from the resulting Intermediate Representation. However, if a group of operations can be represented as a single mathematical operation, and thus as a single operation node in a model graph, the Model Optimizer recognizes such patterns and replaces this group of operation nodes with the only one operation. The result is an Intermediate Representation that has fewer operation nodes than the original model. This decreases the inference time. - -To produce a valid Intermediate Representation, the Model Optimizer must be able to read the original model operations, handle their properties and represent them in Intermediate Representation format, while maintaining validity of the resulting Intermediate Representation. The resulting model consists of operations described in the [Operations Specification](../../ops/opset.md). - -## What You Need to Know about Your Model - -Many common layers exist across known frameworks and neural network topologies. Examples of these layers are `Convolution`, `Pooling`, and `Activation`. To read the original model and produce the Intermediate Representation of a model, the Model Optimizer must be able to work with these layers. - -The full list of them depends on the framework and can be found in the [Supported Framework Layers](Supported_Frameworks_Layers.md) section. If your topology contains only layers from the list of layers, as is the case for the topologies used by most users, the Model Optimizer easily creates the Intermediate Representation. After that you can proceed to work with the Inference Engine. - -However, if you use a topology with layers that are not recognized by the Model Optimizer out of the box, see [Custom Layers in the Model Optimizer](customize_model_optimizer/Customize_Model_Optimizer.md) to learn how to work with custom layers. - -## Model Optimizer Directory Structure - -After installation with OpenVINO™ toolkit or Intel® Deep Learning Deployment Toolkit, the Model Optimizer folder has the following structure (some directories omitted for clarity): -``` -|-- model_optimizer - |-- extensions - |-- front - Front-End framework agnostic transformations (operations output shapes are not defined yet). 
- |-- caffe - Front-End Caffe-specific transformations and Caffe layers extractors - |-- CustomLayersMapping.xml.example - example of file for registering custom Caffe layers (compatible with the 2017R3 release) - |-- kaldi - Front-End Kaldi-specific transformations and Kaldi operations extractors - |-- mxnet - Front-End MxNet-specific transformations and MxNet symbols extractors - |-- onnx - Front-End ONNX-specific transformations and ONNX operators extractors - |-- tf - Front-End TensorFlow-specific transformations, TensorFlow operations extractors, sub-graph replacements configuration files. - |-- middle - Middle-End framework agnostic transformations (layers output shapes are defined). - |-- back - Back-End framework agnostic transformations (preparation for IR generation). - |-- mo - |-- back - Back-End logic: contains IR emitting logic - |-- front - Front-End logic: contains matching between Framework-specific layers and IR specific, calculation of output shapes for each registered layer - |-- graph - Graph utilities to work with internal IR representation - |-- middle - Graph transformations - optimizations of the model - |-- pipeline - Sequence of steps required to create IR for each framework - |-- utils - Utility functions - |-- tf_call_ie_layer - Source code that enables TensorFlow fallback in Inference Engine during model inference - |-- mo.py - Centralized entry point that can be used for any supported framework - |-- mo_caffe.py - Entry point particularly for Caffe - |-- mo_kaldi.py - Entry point particularly for Kaldi - |-- mo_mxnet.py - Entry point particularly for MXNet - |-- mo_onnx.py - Entry point particularly for ONNX - |-- mo_tf.py - Entry point particularly for TensorFlow -``` - -The following sections provide the information about how to use the Model Optimizer, from configuring the tool and generating an IR for a given model to customizing the tool for your needs: - -* [Configuring Model Optimizer](Config_Model_Optimizer.md) -* [Converting a Model to Intermediate Representation](convert_model/Converting_Model.md) -* [Custom Layers in Model Optimizer](customize_model_optimizer/Customize_Model_Optimizer.md) -* [Model Optimization Techniques](Model_Optimization_Techniques.md) -* [Model Optimizer Frequently Asked Questions](Model_Optimizer_FAQ.md) diff --git a/docs/MO_DG/prepare_model/Supported_Frameworks_Layers.md b/docs/MO_DG/prepare_model/Supported_Frameworks_Layers.md index a09df51a56a34d..c01c71752210e6 100644 --- a/docs/MO_DG/prepare_model/Supported_Frameworks_Layers.md +++ b/docs/MO_DG/prepare_model/Supported_Frameworks_Layers.md @@ -67,6 +67,7 @@ Standard MXNet\* symbols: | _minus_scalar | No | | _mul_scalar | No | | _plus_scalar | No | +| _random_uniform | Operation provides sequence from uniform distribution, but exact values won't match. | | _rnn_param_concat | No | | _arange | No | | _contrib_AdaptiveAvgPooling2D | Converted to the Average Pooling with fixed paddings | @@ -272,6 +273,8 @@ Standard TensorFlow\* operations: | PlaceholderWithDefault | No | | Prod | No | | QueueDequeueUpToV2 | Supported only when it is part of a sub-graph of the special form | +| RandomUniform | No | +| RandomUniformInt | No | | Range | No | | Rank | No | | RealDiv | No | @@ -568,6 +571,7 @@ Standard ONNX\* operators: | RNN | No | | ROIAlign | No | | Range | No | +| RandomUniform | Operation provides sequence from uniform distribution, but exact values won't match. 
| | Reciprocal | No | | ReduceL1 | No | | ReduceL2 | No | diff --git a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Caffe.md b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Caffe.md index 4c257d1689ea23..229205f7b68166 100644 --- a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Caffe.md +++ b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Caffe.md @@ -38,7 +38,7 @@ A summary of the steps for optimizing and deploying a model that was trained wit To convert a Caffe\* model: -1. Go to the `$INTEL_OPENVINO_DIR/deployment_tools/model_optimizer` directory. +1. Go to the `$INTEL_OPENVINO_DIR/tools/model_optimizer` directory. 2. Use the `mo.py` script to simply convert a model, specifying the path to the input model `.caffemodel` file and the path to an output directory with write permissions: ```sh python3 mo.py --input_model .caffemodel --output_dir diff --git a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Kaldi.md b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Kaldi.md index 20f2511dcbf148..3aac41fbd67874 100644 --- a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Kaldi.md +++ b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Kaldi.md @@ -33,7 +33,7 @@ A summary of the steps for optimizing and deploying a model that was trained wit To convert a Kaldi\* model: -1. Go to the `/deployment_tools/model_optimizer` directory. +1. Go to the `/tools/model_optimizer` directory. 2. Use the `mo.py` script to simply convert a model with the path to the input model `.nnet` or `.mdl` file and to an output directory where you have write permissions: ```sh python3 mo.py --input_model .nnet --output_dir diff --git a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_MxNet.md b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_MxNet.md index 4b8c1816e8b318..6ac304aa5c236b 100644 --- a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_MxNet.md +++ b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_MxNet.md @@ -27,14 +27,12 @@ A summary of the steps for optimizing and deploying a model that was trained wit |SSD-ResNet-50| [Repo](https://github.com/zhreshold/mxnet-ssd), [Symbol + Params](https://github.com/zhreshold/mxnet-ssd/releases/download/v0.6/resnet50_ssd_512_voc0712_trainval.zip)| |SSD-VGG-16-300| [Repo](https://github.com/zhreshold/mxnet-ssd), [Symbol + Params](https://github.com/zhreshold/mxnet-ssd/releases/download/v0.5-beta/vgg16_ssd_300_voc0712_trainval.zip)| |SSD-Inception v3| [Repo](https://github.com/zhreshold/mxnet-ssd), [Symbol + Params](https://github.com/zhreshold/mxnet-ssd/releases/download/v0.7-alpha/ssd_inceptionv3_512_voc0712trainval.zip)| -|FCN8 (Semantic Segmentation)| [Repo](https://github.com/apache/incubator-mxnet/tree/master/example/fcn-xs), [Symbol](https://www.dropbox.com/sh/578n5cxej7ofd6m/AAA9SFCBN8R_uL2CnAd3WQ5ia/FCN8s_VGG16-symbol.json?dl=0), [Params](https://www.dropbox.com/sh/578n5cxej7ofd6m/AABHWZHCtA2P6iR6LUflkxb_a/FCN8s_VGG16-0019-cpu.params?dl=0)| |MTCNN part 1 (Face Detection)| [Repo](https://github.com/pangyupo/mxnet_mtcnn_face_detection), [Symbol](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det1-symbol.json), [Params](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det1-0001.params)| |MTCNN part 2 (Face Detection)| [Repo](https://github.com/pangyupo/mxnet_mtcnn_face_detection), [Symbol](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det2-symbol.json), 
[Params](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det2-0001.params)| |MTCNN part 3 (Face Detection)| [Repo](https://github.com/pangyupo/mxnet_mtcnn_face_detection), [Symbol](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det3-symbol.json), [Params](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det3-0001.params)| |MTCNN part 4 (Face Detection)| [Repo](https://github.com/pangyupo/mxnet_mtcnn_face_detection), [Symbol](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det4-symbol.json), [Params](https://github.com/pangyupo/mxnet_mtcnn_face_detection/blob/master/model/det4-0001.params)| |Lightened_moon| [Repo](https://github.com/tornadomeet/mxnet-face/tree/master/model/lightened_moon), [Symbol](https://github.com/tornadomeet/mxnet-face/blob/master/model/lightened_moon/lightened_moon_fuse-symbol.json), [Params](https://github.com/tornadomeet/mxnet-face/blob/master/model/lightened_moon/lightened_moon_fuse-0082.params)| |RNN-Transducer| [Repo](https://github.com/HawkAaron/mxnet-transducer) | -|word_lm| [Repo](https://github.com/apache/incubator-mxnet/tree/master/example/rnn/word_lm) | **Other supported topologies** @@ -45,7 +43,7 @@ A summary of the steps for optimizing and deploying a model that was trained wit To convert an MXNet\* model: -1. Go to the `/deployment_tools/model_optimizer` directory. +1. Go to the `/tools/model_optimizer` directory. 2. To convert an MXNet\* model contained in a `model-file-symbol.json` and `model-file-0000.params`, run the Model Optimizer launch script `mo.py`, specifying a path to the input model file and a path to an output directory with write permissions: ```sh python3 mo_mxnet.py --input_model model-file-0000.params --output_dir diff --git a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_ONNX.md b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_ONNX.md index 79f740b55ecdd4..6ab9ef30e43782 100644 --- a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_ONNX.md +++ b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_ONNX.md @@ -59,7 +59,7 @@ The Model Optimizer process assumes you have an ONNX model that was directly dow To convert an ONNX\* model: -1. Go to the `/deployment_tools/model_optimizer` directory. +1. Go to the `/tools/model_optimizer` directory. 2. Use the `mo.py` script to simply convert a model with the path to the input model `.nnet` file and an output directory where you have write permissions: ```sh python3 mo.py --input_model .onnx --output_dir diff --git a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Paddle.md b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Paddle.md index 65f5c8fbbab1ba..d2d75aefb08541 100644 --- a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Paddle.md +++ b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_Paddle.md @@ -29,7 +29,7 @@ A summary of the steps for optimizing and deploying a model that was trained wit To convert a Paddle\* model: -1. Go to the `$INTEL_OPENVINO_DIR/deployment_tools/model_optimizer` directory. +1. Go to the `$INTEL_OPENVINO_DIR/tools/model_optimizer` directory. 2. 
Use the `mo.py` script to simply convert a model, specifying the framework, the path to the input model `.pdmodel` file and the path to an output directory with write permissions: ```sh python3 mo.py --input_model .pdmodel --output_dir --framework=paddle diff --git a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_TensorFlow.md b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_TensorFlow.md index 7e29a7668b2f24..d5124fab21b0e6 100644 --- a/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_TensorFlow.md +++ b/docs/MO_DG/prepare_model/convert_model/Convert_Model_From_TensorFlow.md @@ -37,7 +37,7 @@ Detailed information on how to convert models from the TensorFlow 1 Detection Model Zoo is available in the [Converting TensorFlow Object Detection API Models](tf_specific/Convert_Object_Detection_API_Models.md) chapter. The table below contains models from the Object Detection Models zoo that are supported. +Detailed information on how to convert models from the TensorFlow 1 Object Detection Models Zoo and TensorFlow 2 Object Detection Models Zoo is available in the [Converting TensorFlow Object Detection API Models](tf_specific/Convert_Object_Detection_API_Models.md) chapter. The table below contains models from the Object Detection Models Zoo that are supported. | Model Name| TensorFlow 1 Object Detection API Models| | :------------- | -----:| @@ -178,7 +178,7 @@ There are three ways to store non-frozen TensorFlow models and load them to the To convert such a TensorFlow model: - 1. Go to the `/deployment_tools/model_optimizer` directory + 1. Go to the `/tools/model_optimizer` directory 2. Run the `mo_tf.py` script with the path to the checkpoint file to convert a model and an output directory where you have write permissions: * If input model is in `.pb` format:
@@ -200,7 +200,7 @@ python3 mo_tf.py --input_model .pbtxt --input_checkpoint /deployment_tools/model_optimizer` directory + 1. Go to the `/tools/model_optimizer` directory 2. Run the `mo_tf.py` script with a path to the MetaGraph `.meta` file and a writable output directory to convert a model:
```sh python3 mo_tf.py --input_meta_graph .meta --output_dir @@ -212,7 +212,7 @@ python3 mo_tf.py --input_meta_graph .meta --output_dir /deployment_tools/model_optimizer` directory + 1. Go to the `/tools/model_optimizer` directory 2. Run the `mo_tf.py` script with a path to the SavedModel directory and a writable output directory to convert a model:
```sh python3 mo_tf.py --saved_model_dir --output_dir @@ -251,7 +251,7 @@ Where: To convert a TensorFlow model: -1. Go to the `/deployment_tools/model_optimizer` directory +1. Go to the `/tools/model_optimizer` directory 2. Use the `mo_tf.py` script to simply convert a model with the path to the input model `.pb` file and a writable output directory: ```sh python3 mo_tf.py --input_model .pb --output_dir @@ -342,7 +342,7 @@ Below are the instructions on how to convert each of them. A model in the SavedModel format consists of a directory with a `saved_model.pb` file and two subfolders: `variables` and `assets`. To convert such a model: -1. Go to the `/deployment_tools/model_optimizer` directory. +1. Go to the `/tools/model_optimizer` directory. 2. Run the `mo_tf.py` script with a path to the SavedModel directory and a writable output directory: ```sh python3 mo_tf.py --saved_model_dir --output_dir @@ -405,10 +405,8 @@ Refer to [Supported Framework Layers ](../Supported_Frameworks_Layers.md) for th The Model Optimizer provides explanatory messages if it is unable to run to completion due to issues like typographical errors, incorrectly used options, or other issues. The message describes the potential cause of the problem and gives a link to the [Model Optimizer FAQ](../Model_Optimizer_FAQ.md). The FAQ has instructions on how to resolve most issues. The FAQ also includes links to relevant sections in the Model Optimizer Developer Guide to help you understand what went wrong. ## Video: Converting a TensorFlow Model -[![](https://img.youtube.com/vi/QW6532LtiTc/0.jpg)](https://www.youtube.com/watch?v=QW6532LtiTc) -\htmlonly + -\endhtmlonly ## Summary In this document, you learned: diff --git a/docs/MO_DG/prepare_model/convert_model/Converting_Model.md b/docs/MO_DG/prepare_model/convert_model/Converting_Model.md index 26ce1289b8c04e..78acbd694e139c 100644 --- a/docs/MO_DG/prepare_model/convert_model/Converting_Model.md +++ b/docs/MO_DG/prepare_model/convert_model/Converting_Model.md @@ -1,39 +1,20 @@ # Converting a Model to Intermediate Representation (IR) {#openvino_docs_MO_DG_prepare_model_convert_model_Converting_Model} -Use the mo.py script from the `/deployment_tools/model_optimizer` directory to run the Model Optimizer and convert the model to the Intermediate Representation (IR). -The simplest way to convert a model is to run mo.py with a path to the input model file and an output directory where you have write permissions: +Use the mo.py script from the `/tools/model_optimizer` directory to run the Model Optimizer and convert the model to the Intermediate Representation (IR): ```sh python3 mo.py --input_model INPUT_MODEL --output_dir ``` +You need to have have write permissions for an output directory. -> **NOTE**: Some models require using additional arguments to specify conversion parameters, such as `--scale`, `--scale_values`, `--mean_values`, `--mean_file`. To learn about when you need to use these parameters, refer to [Converting a Model Using General Conversion Parameters](Converting_Model_General.md). - -The mo.py script is the universal entry point that can deduce the framework that has produced the input model by a standard extension of the model file: - -* `.caffemodel` - Caffe\* models -* `.pb` - TensorFlow\* models -* `.params` - MXNet\* models -* `.onnx` - ONNX\* models -* `.nnet` - Kaldi\* models. - -If the model files do not have standard extensions, you can use the ``--framework {tf,caffe,kaldi,onnx,mxnet,paddle}`` option to specify the framework type explicitly. 
- -For example, the following commands are equivalent: -```sh -python3 mo.py --input_model /user/models/model.pb -``` -```sh -python3 mo.py --framework tf --input_model /user/models/model.pb -``` +> **NOTE**: Some models require using additional arguments to specify conversion parameters, such as `--input_shape`, `--scale`, `--scale_values`, `--mean_values`, `--mean_file`. To learn about when you need to use these parameters, refer to [Converting a Model Using General Conversion Parameters](Converting_Model_General.md). To adjust the conversion process, you may use general parameters defined in the [Converting a Model Using General Conversion Parameters](Converting_Model_General.md) and Framework-specific parameters for: -* [Caffe](Convert_Model_From_Caffe.md), -* [TensorFlow](Convert_Model_From_TensorFlow.md), -* [MXNet](Convert_Model_From_MxNet.md), -* [ONNX](Convert_Model_From_ONNX.md), -* [Kaldi](Convert_Model_From_Kaldi.md). -* [Paddle](Convert_Model_From_Paddle.md). +* [Caffe](Convert_Model_From_Caffe.md) +* [TensorFlow](Convert_Model_From_TensorFlow.md) +* [MXNet](Convert_Model_From_MxNet.md) +* [ONNX](Convert_Model_From_ONNX.md) +* [Kaldi](Convert_Model_From_Kaldi.md) ## See Also diff --git a/docs/MO_DG/prepare_model/convert_model/Converting_Model_General.md b/docs/MO_DG/prepare_model/convert_model/Converting_Model_General.md index 2d267cda3e7172..114bf7a3ce0f68 100644 --- a/docs/MO_DG/prepare_model/convert_model/Converting_Model_General.md +++ b/docs/MO_DG/prepare_model/convert_model/Converting_Model_General.md @@ -5,7 +5,7 @@ To simply convert a model trained by any supported framework, run the Model Opti python3 mo.py --input_model INPUT_MODEL --output_dir ``` -The script is in `$INTEL_OPENVINO_DIR/deployment_tools/model_optimizer/`. The output directory must have write permissions, so you can run mo.py from the output directory or specify an output path with the `--output_dir` option. +The script is in `$INTEL_OPENVINO_DIR/tools/model_optimizer/`. The output directory must have write permissions, so you can run mo.py from the output directory or specify an output path with the `--output_dir` option. > **NOTE:** The color channel order (RGB or BGR) of an input data should match the channel order of the model training dataset. If they are different, perform the `RGB<->BGR` conversion specifying the command-line parameter: `--reverse_input_channels`. Otherwise, inference results may be incorrect. For details, refer to [When to Reverse Input Channels](#when_to_reverse_input_channels). @@ -212,8 +212,7 @@ Launch the Model Optimizer for the Caffe bvlc_alexnet model with reversed input python3 mo.py --input_model bvlc_alexnet.caffemodel --reverse_input_channels --mean_values [255,255,255] --data_type FP16 --output_dir ``` -Launch the Model Optimizer for the Caffe bvlc_alexnet model with extensions listed in specified directories, specified mean_images binaryproto. - file For more information about extensions, please refer to [this](../customize_model_optimizer/Extending_Model_Optimizer_with_New_Primitives.md) page. +Launch the Model Optimizer for the Caffe bvlc_alexnet model with extensions listed in specified directories, specified mean_images binaryproto file. For more information about extensions, please refer to [this](../customize_model_optimizer/Extending_Model_Optimizer_with_New_Primitives.md) page. 
```sh python3 mo.py --input_model bvlc_alexnet.caffemodel --extensions /home/,/some/other/path/ --mean_file /path/to/binaryproto --output_dir ``` diff --git a/docs/MO_DG/prepare_model/convert_model/Cutting_Model.md b/docs/MO_DG/prepare_model/convert_model/Cutting_Model.md index d86368a9f708f5..d0248d149bc7cd 100644 --- a/docs/MO_DG/prepare_model/convert_model/Cutting_Model.md +++ b/docs/MO_DG/prepare_model/convert_model/Cutting_Model.md @@ -19,7 +19,7 @@ Model Optimizer provides command line options `--input` and `--output` to specif * `--input` option accepts a comma-separated list of layer names of the input model that should be treated as new entry points to the model. * `--output` option accepts a comma-separated list of layer names of the input model that should be treated as new exit points from the model. -The `--input` option is required for cases unrelated to model cutting. For example, when the model contains several inputs and `--input_shape` or `--mean_values` options are used, you should use the `--input` option to specify the order of input nodes for correct mapping between multiple items provided in `--input_shape` and `--mean_values` and the inputs in the model. This is out of scope. +The `--input` option is required for cases unrelated to model cutting. For example, when the model contains several inputs and `--input_shape` or `--mean_values` options are used, you should use the `--input` option to specify the order of input nodes for correct mapping between multiple items provided in `--input_shape` and `--mean_values` and the inputs in the model. Details on these options are out of scope for this document, which focuses on model cutting. Model cutting is illustrated with Inception V1. This model is in `models/research/slim` repository. [This section](Converting_Model.md) describes pre-work to prepare the model for the Model Optimizer to be ready to proceed with this chapter. @@ -39,7 +39,7 @@ In the TensorBoard, it looks the following way together with some predecessors: Convert this model and put the results in a writable output directory: ```sh -${INTEL_OPENVINO_DIR}/deployment_tools/model_optimizer +${INTEL_OPENVINO_DIR}/tools/model_optimizer python3 mo.py --input_model inception_v1.pb -b 1 --output_dir ``` (The other examples on this page assume that you first cd to the `model_optimizer` directory and add the `--output_dir` argument with a directory where you have write permissions.) diff --git a/docs/MO_DG/prepare_model/convert_model/IR_suitable_for_INT8_inference.md b/docs/MO_DG/prepare_model/convert_model/IR_suitable_for_INT8_inference.md index fa4bdb50554913..4f9baa1386cb7d 100644 --- a/docs/MO_DG/prepare_model/convert_model/IR_suitable_for_INT8_inference.md +++ b/docs/MO_DG/prepare_model/convert_model/IR_suitable_for_INT8_inference.md @@ -9,7 +9,7 @@ Intermediate Representation (IR) should be specifically formed to be suitable fo Such an IR is called a Low Precision IR and you can generate it in two ways: - [Quantize regular IR with the Post-Training Optimization tool](@ref pot_README) - Use the Model Optimizer for a model pretrained for Low Precision inference: TensorFlow\* pre-TFLite models (`.pb` model file with `FakeQuantize*` operations) and ONNX\* quantized models. 
-Both Tensorflow and ONNX quantized models could be prepared by [Neural Network Compression Framework](https://github.com/openvinotoolkit/nncf/blob/develop/README.md) +Both TensorFlow and ONNX quantized models could be prepared by [Neural Network Compression Framework](https://github.com/openvinotoolkit/nncf/blob/develop/README.md). For an operation to be executed in INT8, it must have `FakeQuantize` operations as inputs. See the [specification of `FakeQuantize` operation](../../../ops/quantization/FakeQuantize_1.md) for details. @@ -17,7 +17,7 @@ See the [specification of `FakeQuantize` operation](../../../ops/quantization/Fa To execute the `Convolution` operation in INT8 on CPU, both data and weight inputs should have `FakeQuantize` as an input operation: ![](../../img/expanded_int8_Convolution_weights.png) -Low pecision IR is also suitable for FP32 and FP16 inference if a chosen plugin supports all operations of the IR, because the only difference between a Low Precision IR and FP16 or FP32 IR is the existence of `FakeQuantize` in the Low Precision IR. +Low precision IR is also suitable for FP32 and FP16 inference if a chosen plugin supports all operations of the IR, because the only difference between a Low Precision IR and FP16 or FP32 IR is the existence of `FakeQuantize` in the Low Precision IR. Plugins with Low Precision Inference support recognize these sub-graphs and quantize them during the inference time. Plugins without Low Precision support execute all operations, including `FakeQuantize`, as is in the FP32 or FP16 precision. diff --git a/docs/MO_DG/prepare_model/convert_model/mxnet_specific/Convert_Style_Transfer_From_MXNet.md b/docs/MO_DG/prepare_model/convert_model/mxnet_specific/Convert_Style_Transfer_From_MXNet.md index f0ec23d5a9f631..eb1a7094673e2f 100644 --- a/docs/MO_DG/prepare_model/convert_model/mxnet_specific/Convert_Style_Transfer_From_MXNet.md +++ b/docs/MO_DG/prepare_model/convert_model/mxnet_specific/Convert_Style_Transfer_From_MXNet.md @@ -90,6 +90,8 @@ Where the `models/13` string is composed of the following substrings: * `models/`: path to the folder that contains .nd files with pre-trained styles weights * `13`: prefix pointing to 13_decoder, which is the default decoder for the repository +>**NOTE**: If you get an error saying "No module named 'cPickle'", try running the script from this step in Python 2. Then return to Python 3 for the remaining steps. + You can choose any style from [collection of pre-trained weights](https://pan.baidu.com/s/1skMHqYp). (On the Chinese-language page, click the down arrow next to a size in megabytes. Then wait for an overlay box to appear, and click the blue button in it to download.) The `generate()` function generates `nst_vgg19-symbol.json` and `vgg19-symbol.json` files for the specified shape. In the code, it is [1024 x 768] for a 4:3 ratio, and you can specify another, for example, [224,224] for a square ratio. #### 6. 
Run the Model Optimizer to generate an Intermediate Representation (IR): diff --git a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_F3Net.md b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_F3Net.md index ffb16eb5f7cc5f..0d130197f74a2c 100644 --- a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_F3Net.md +++ b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_F3Net.md @@ -2,15 +2,19 @@ [F3Net](https://github.com/weijun88/F3Net): Fusion, Feedback and Focus for Salient Object Detection +## Clone the F3Net Model Repository + +To clone the repository, run the following command: +```bash +git clone http://github.com/weijun88/F3Net.git +``` + ## Download and Convert the Model to ONNX* To download the pre-trained model or train the model yourself, refer to the -[instruction](https://github.com/weijun88/F3Net/blob/master/README.md) in the F3Net model repository. Firstly, -convert the model to ONNX\* format. Create and run the script with the following content in the `src` -directory of the model repository: +[instruction](https://github.com/weijun88/F3Net/blob/master/README.md) in the F3Net model repository. First, convert the model to ONNX\* format. Create and run the script with the following content in the `src` directory of the model repository: ```python import torch - from dataset import Config from net import F3Net @@ -19,7 +23,7 @@ net = F3Net(cfg) image = torch.zeros([1, 3, 352, 352]) torch.onnx.export(net, image, 'f3net.onnx', export_params=True, do_constant_folding=True, opset_version=11) ``` -The script generates the ONNX\* model file f3net.onnx. The model conversion was tested with the repository hash commit `eecace3adf1e8946b571a4f4397681252f9dc1b8`. +The script generates the ONNX\* model file `f3net.onnx`. This model conversion was tested with the repository hash commit `eecace3adf1e8946b571a4f4397681252f9dc1b8`. ## Convert ONNX* F3Net Model to IR diff --git a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md index a58e886d4f4230..31de647f379158 100644 --- a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md +++ b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_RNNT.md @@ -20,15 +20,15 @@ mkdir rnnt_for_openvino cd rnnt_for_openvino ``` -**Step 3**. Download pretrained weights for PyTorch implementation from https://zenodo.org/record/3662521#.YG21DugzZaQ. -For UNIX*-like systems you can use wget: +**Step 3**. Download pretrained weights for PyTorch implementation from [https://zenodo.org/record/3662521#.YG21DugzZaQ](https://zenodo.org/record/3662521#.YG21DugzZaQ). +For UNIX*-like systems you can use `wget`: ```bash wget https://zenodo.org/record/3662521/files/DistributedDataParallel_1576581068.9962234-epoch-100.pt ``` The link was taken from `setup.sh` in the `speech_recoginitin/rnnt` subfolder. You will get exactly the same weights as -if you were following the steps from https://github.com/mlcommons/inference/tree/master/speech_recognition/rnnt. +if you were following the steps from [https://github.com/mlcommons/inference/tree/master/speech_recognition/rnnt](https://github.com/mlcommons/inference/tree/master/speech_recognition/rnnt). -**Step 4**. Install required python* packages: +**Step 4**. 
Install required Python packages: ```bash pip3 install torch toml ``` @@ -37,7 +37,7 @@ pip3 install torch toml `export_rnnt_to_onnx.py` and run it in the current directory `rnnt_for_openvino`: > **NOTE**: If you already have a full clone of MLCommons inference repository, you need to -> specify `mlcommons_inference_path` variable. +> specify the `mlcommons_inference_path` variable. ```python import toml @@ -92,8 +92,7 @@ torch.onnx.export(model.joint, (f, g), "rnnt_joint.onnx", opset_version=12, python3 export_rnnt_to_onnx.py ``` -After completing this step, the files rnnt_encoder.onnx, rnnt_prediction.onnx, and rnnt_joint.onnx will be saved in -the current directory. +After completing this step, the files `rnnt_encoder.onnx`, `rnnt_prediction.onnx`, and `rnnt_joint.onnx` will be saved in the current directory. **Step 6**. Run the conversion command: @@ -102,6 +101,6 @@ python3 {path_to_openvino}/mo.py --input_model rnnt_encoder.onnx --input "input. python3 {path_to_openvino}/mo.py --input_model rnnt_prediction.onnx --input "input.1[1 1],1[2 1 320],2[2 1 320]" python3 {path_to_openvino}/mo.py --input_model rnnt_joint.onnx --input "0[1 1 1024],1[1 1 320]" ``` -Please note that hardcoded value for sequence length = 157 was taken from the MLCommons, but conversion to IR preserves -network [reshapeability](../../../../IE_DG/ShapeInference.md); this means you can change input shapes manually to any value either during conversion or -inference. +Please note that hardcoded value for sequence length = 157 was taken from the MLCommons but conversion to IR preserves +network [reshapeability](../../../../IE_DG/ShapeInference.md), this means you can change input shapes manually to any value either during conversion or +inference. \ No newline at end of file diff --git a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_YOLACT.md b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_YOLACT.md index 9fb7e1ca9e9ce3..50272a33f74d4c 100644 --- a/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_YOLACT.md +++ b/docs/MO_DG/prepare_model/convert_model/pytorch_specific/Convert_YOLACT.md @@ -138,7 +138,7 @@ git checkout 57b8f2d95e62e2e649b382f516ab41f949b57239 3. Set up the environment as described in `README.md`. -**Step 2**. Download a pre-trained model from the list attached in the `Evaluation` section of `README.md` document, for example `yolact_base_54_800000.pth`. +**Step 2**. Download a pre-trained model from the list attached in the `Evaluation` section of the [README.md](https://github.com/dbolya/yolact/blob/master/README.md) document, for example `yolact_base_54_800000.pth`. **Step 3**. Export the model to ONNX* format. @@ -187,5 +187,4 @@ python path/to/model_optimizer/mo.py \ --input_model /path/to/yolact.onnx \ --reverse_input_channels \ --scale 255 -``` - +``` \ No newline at end of file diff --git a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_EfficientDet_Models.md b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_EfficientDet_Models.md index b78ec640cba19c..fe829c1c21cbd3 100644 --- a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_EfficientDet_Models.md +++ b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_EfficientDet_Models.md @@ -47,9 +47,9 @@ As a result the frozen model file `savedmodeldir/efficientdet-d4_frozen.pb` will To generate the IR of the EfficientDet TensorFlow model, run:
```sh -python3 $INTEL_OPENVINO_DIR/deployment_tools/model_optimizer/mo.py \ +python3 $INTEL_OPENVINO_DIR/tools/model_optimizer/mo.py \ --input_model savedmodeldir/efficientdet-d4_frozen.pb \ ---transformations_config $INTEL_OPENVINO_DIR/deployment_tools/model_optimizer/extensions/front/tf/automl_efficientdet.json \ +--transformations_config $INTEL_OPENVINO_DIR/tools/model_optimizer/extensions/front/tf/automl_efficientdet.json \ --input_shape [1,$IMAGE_SIZE,$IMAGE_SIZE,3] \ --reverse_input_channels ``` diff --git a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_Object_Detection_API_Models.md b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_Object_Detection_API_Models.md index eabe4840eb885a..076fe4716cc205 100644 --- a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_Object_Detection_API_Models.md +++ b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_Object_Detection_API_Models.md @@ -3,20 +3,18 @@ > **NOTES**: > * Starting with the 2022.1 release, the Model Optimizer can convert the TensorFlow\* Object Detection API Faster and Mask RCNNs topologies differently. By default, the Model Optimizer adds operation "Proposal" to the generated IR. This operation needs an additional input to the model with name "image_info" which should be fed with several values describing the pre-processing applied to the input image (refer to the [Proposal](../../../../ops/detection/Proposal_4.md) operation specification for more information). However, this input is redundant for the models trained and inferred with equal size images. Model Optimizer can generate IR for such models and insert operation [DetectionOutput](../../../../ops/detection/DetectionOutput_1.md) instead of `Proposal`. The `DetectionOutput` operation does not require additional model input "image_info" and moreover, for some models the produced inference results are closer to the original TensorFlow\* model. In order to trigger new behaviour the attribute "operation_to_add" in the corresponding JSON transformation configuration file should be set to value "DetectionOutput" instead of default one "Proposal". > * Starting with the 2021.1 release, the Model Optimizer converts the TensorFlow\* Object Detection API SSDs, Faster and Mask RCNNs topologies keeping shape-calculating sub-graphs by default, so topologies can be re-shaped in the Inference Engine using dedicated reshape API. Refer to [Using Shape Inference](../../../../IE_DG/ShapeInference.md) for more information on how to use this feature. It is possible to change the both spatial dimensions of the input image and batch size. -> * To generate IRs for SSD topologies, the Model Optimizer creates a number of `PriorBoxClustered` layers instead of a constant node with prior boxes calculated for the particular input image size. This change allows you to reshape the topology in the Inference Engine using dedicated Inference Engine API. The reshaping is supported for all SSD topologies except FPNs which contain hardcoded shapes for some operations preventing from changing topology input shape. +> * To generate IRs for TF 1 SSD topologies, the Model Optimizer creates a number of `PriorBoxClustered` operations instead of a constant node with prior boxes calculated for the particular input image size. This change allows you to reshape the topology in the Inference Engine using dedicated Inference Engine API. 
The reshaping is supported for all SSD topologies except FPNs which contain hardcoded shapes for some operations preventing from changing topology input shape. ## How to Convert a Model -With 2018 R3 release, the Model Optimizer introduces a new approach to convert models created using the TensorFlow\* Object Detection API. Compared with the previous approach, the new process produces inference results with higher accuracy and does not require modifying any configuration files and providing intricate command line parameters. - You can download TensorFlow\* Object Detection API models from the TensorFlow 1 Detection Model Zoo or TensorFlow 2 Detection Model Zoo. NOTE: Before converting, make sure you have configured the Model Optimizer. For configuration steps, refer to [Configuring the Model Optimizer](../../Config_Model_Optimizer.md). -To convert a TensorFlow\* Object Detection API model, go to the `/deployment_tools/model_optimizer` directory and run the `mo_tf.py` script with the following required parameters: +To convert a TensorFlow\* Object Detection API model, go to the `/tools/model_optimizer` directory and run the `mo_tf.py` script with the following required parameters: * `--input_model ` --- File with a pre-trained model (binary or text .pb file after freezing) OR `--saved_model_dir ` for the TensorFlow\* 2 models -* `--transformations_config ` --- A subgraph replacement configuration file with transformations description. For the models downloaded from the TensorFlow\* Object Detection API zoo, you can find the configuration files in the `/deployment_tools/model_optimizer/extensions/front/tf` directory. Use: +* `--transformations_config ` --- A subgraph replacement configuration file with transformations description. For the models downloaded from the TensorFlow\* Object Detection API zoo, you can find the configuration files in the `/tools/model_optimizer/extensions/front/tf` directory. 
Use: * `ssd_v2_support.json` --- for frozen SSD topologies from the models zoo version up to 1.13.X inclusively * `ssd_support_api_v.1.14.json` --- for SSD topologies trained using the TensorFlow\* Object Detection API version 1.14 up to 1.14.X inclusively * `ssd_support_api_v.1.15.json` --- for SSD topologies trained using the TensorFlow\* Object Detection API version 1.15 up to 2.0 @@ -54,9 +52,26 @@ Additionally to the mandatory parameters listed above you can use optional conve For example, if you downloaded the [pre-trained SSD InceptionV2 topology](http://download.tensorflow.org/models/object_detection/ssd_inception_v2_coco_2018_01_28.tar.gz) and extracted archive to the directory `/tmp/ssd_inception_v2_coco_2018_01_28`, the sample command line to convert the model looks as follows: ``` -/deployment_tools/model_optimizer/mo_tf.py --input_model=/tmp/ssd_inception_v2_coco_2018_01_28/frozen_inference_graph.pb --transformations_config /deployment_tools/model_optimizer/extensions/front/tf/ssd_v2_support.json --tensorflow_object_detection_api_pipeline_config /tmp/ssd_inception_v2_coco_2018_01_28/pipeline.config --reverse_input_channels +/tools/model_optimizer/mo_tf.py --input_model=/tmp/ssd_inception_v2_coco_2018_01_28/frozen_inference_graph.pb --transformations_config /tools/model_optimizer/extensions/front/tf/ssd_v2_support.json --tensorflow_object_detection_api_pipeline_config /tmp/ssd_inception_v2_coco_2018_01_28/pipeline.config --reverse_input_channels ``` +## Important Notes About Feeding Input Images to the Samples + +Inference Engine comes with a number of samples to infer Object Detection API models including: + +* [Object Detection for SSD Sample](../../../../../inference-engine/samples/object_detection_sample_ssd/README.md) --- for RFCN, SSD and Faster R-CNNs +* [Mask R-CNN Sample for TensorFlow* Object Detection API Models](@ref omz_demos_mask_rcnn_demo_cpp) --- for Mask R-CNNs + +There are several important notes about feeding input images to the samples: + +1. Inference Engine samples stretch input image to the size of the input operation without preserving aspect ratio. This behavior is usually correct for most topologies (including SSDs), but incorrect for other models like Faster R-CNN, Mask R-CNN and R-FCN. These models usually use keeps aspect ratio resizer. The type of pre-processing is defined in the pipeline configuration file in the section `image_resizer`. If keeping aspect ratio is used, then it is necessary to resize image before passing it to the sample and optionally pad the resized image with 0s (if the attribute "pad_to_max_dimension" in the pipeline.config is equal to "true"). + +2. TensorFlow\* implementation of image resize may be different from the one implemented in the sample. Even reading input image from compressed format (like `.jpg`) could give different results in the sample and TensorFlow\*. So, if it is necessary to compare accuracy between the TensorFlow\* and the Inference Engine it is recommended to pass pre-resized input image in a non-compressed format (like `.bmp`). + +3. If you want to infer the model with the Inference Engine samples, convert the model specifying the `--reverse_input_channels` command line parameter. The samples load images in BGR channels order, while TensorFlow* models were trained with images in RGB order. 
When the `--reverse_input_channels` command line parameter is specified, the Model Optimizer modifies the weights of the first convolution or another channel-dependent operation so that the output is the same as if the image were passed in the RGB channel order. + +4. Read carefully the messages printed by the Model Optimizer during model conversion. They contain important instructions on how to prepare the input data before running the inference and how to interpret the output. + ## Custom Input Shape Model Optimizer handles the command line parameter `--input_shape` for TensorFlow\* Object Detection API models in a special way depending on the image resizer type defined in the `pipeline.config` file. TensorFlow\* Object Detection API generates different `Preprocessor` sub-graph based on the image resizer type. Model Optimizer supports two types of image resizer: * `fixed_shape_resizer` --- *Stretches* input image to the specific height and width. The `pipeline.config` snippet below shows a `fixed_shape_resizer` sample definition: @@ -77,19 +92,20 @@ image_resizer { } } ``` +If the additional parameter "pad_to_max_dimension" is equal to "true", the resized image is padded with 0s to a square image of size "max_dimension". ### Fixed Shape Resizer Replacement -* If the `--input_shape` command line parameter is not specified, the Model Optimizer generates an input layer with the height and width as defined in the `pipeline.config`. +* If the `--input_shape` command line parameter is not specified, the Model Optimizer generates an input operation with the height and width as defined in the `pipeline.config`. -* If the `--input_shape [1, H, W, 3]` command line parameter is specified, the Model Optimizer sets the input layer height to `H` and width to `W` and convert the model. However, the conversion may fail because of the following reasons: - * The model is not reshape-able, meaning that it's not possible to change the size of the model input image. For example, SSD FPN models have `Reshape` operations with hard-coded output shapes, but the input size to these `Reshape` instances depends on the input image size. In this case, the Model Optimizer shows an error during the shape inference phase. Run the Model Optimizer with `--log_level DEBUG` to see the inferred layers output shapes to see the mismatch. +* If the `--input_shape [1, H, W, 3]` command line parameter is specified, the Model Optimizer sets the input operation height to `H` and width to `W` and converts the model. However, the conversion may fail for the following reasons: + * The model is not reshape-able, meaning that it's not possible to change the size of the model input image. For example, SSD FPN models have `Reshape` operations with hard-coded output shapes, but the input size to these `Reshape` instances depends on the input image size. In this case, the Model Optimizer shows an error during the shape inference phase. Run the Model Optimizer with `--log_level DEBUG` to see the inferred operations output shapes and find the mismatch. * Custom input shape is too small. For example, if you specify `--input_shape [1,100,100,3]` to convert a SSD Inception V2 model, one of convolution or pooling nodes decreases input tensor spatial dimensions to non-positive values. In this case, the Model Optimizer shows error message like this: '[ ERROR ] Shape [ 1 -1 -1 256] is not fully defined for output X of "node_name".'
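+For models that keep the aspect ratio (see the next subsection and the Important Notes above), the input image has to be pre-processed before it is passed to a sample. A minimal sketch of such pre-processing is shown below; it assumes OpenCV and NumPy are available and a 3-channel input image, and the function name and values are illustrative only, not part of the Model Optimizer or the Inference Engine samples:
+
+```python
+import cv2
+import numpy as np
+
+
+def preprocess_keep_aspect_ratio(image: np.ndarray, min_dimension: int, max_dimension: int,
+                                 pad_to_max_dimension: bool = False) -> np.ndarray:
+    # Illustrative sketch (not part of OpenVINO): resize a 3-channel image the same way
+    # the keep_aspect_ratio_resizer does and optionally pad it with zeros to a square.
+    h, w = image.shape[:2]
+    # Scale the shorter side towards min_dimension without letting the longer side
+    # exceed max_dimension (same rule as calculate_shape_keeping_aspect_ratio below).
+    ratio = min(min_dimension / min(h, w), max_dimension / max(h, w))
+    new_h, new_w = int(round(h * ratio)), int(round(w * ratio))
+    resized = cv2.resize(image, (new_w, new_h))
+    if not pad_to_max_dimension:
+        return resized
+    # Mirror the "pad_to_max_dimension" option from pipeline.config: pad the resized
+    # image with 0s to a square of size max_dimension x max_dimension.
+    padded = np.zeros((max_dimension, max_dimension, image.shape[2]), dtype=image.dtype)
+    padded[:new_h, :new_w] = resized
+    return padded
+
+
+# Usage example (paths and values are illustrative). cv2.imread returns the image in the
+# BGR channel order, which matches the samples when the model was converted with
+# --reverse_input_channels.
+# image = cv2.imread('/tmp/input.bmp')
+# blob = preprocess_keep_aspect_ratio(image, min_dimension=600, max_dimension=1024,
+#                                     pad_to_max_dimension=True)
+```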
### Keep Aspect Ratio Resizer Replacement -* If the `--input_shape` command line parameter is not specified, the Model Optimizer generates an input layer with both height and width equal to the value of parameter `min_dimension` in the `keep_aspect_ratio_resizer`. +* If the `--input_shape` command line parameter is not specified, the Model Optimizer generates an input operation with both height and width equal to the value of parameter `min_dimension` in the `keep_aspect_ratio_resizer`. -* If the `--input_shape [1, H, W, 3]` command line parameter is specified, the Model Optimizer scales the specified input image height `H` and width `W` to satisfy the `min_dimension` and `max_dimension` constraints defined in the `keep_aspect_ratio_resizer`. The following function calculates the input layer height and width: +* If the `--input_shape [1, H, W, 3]` command line parameter is specified, the Model Optimizer scales the specified input image height `H` and width `W` to satisfy the `min_dimension` and `max_dimension` constraints defined in the `keep_aspect_ratio_resizer`. The following function calculates the input operation height and width: ```python def calculate_shape_keeping_aspect_ratio(H: int, W: int, min_dimension: int, max_dimension: int): @@ -98,955 +114,18 @@ def calculate_shape_keeping_aspect_ratio(H: int, W: int, min_dimension: int, max ratio = min(ratio_min, ratio_max) return int(round(H * ratio)), int(round(W * ratio)) ``` +The `--input_shape` command line parameter should be specified only if the "pad_to_max_dimension" does not exist or is set to "false" in the `keep_aspect_ratio_resizer`. -Models with `keep_aspect_ratio_resizer` were trained to recognize object in real aspect ratio, in contrast with most of the classification topologies trained to recognize objects stretched vertically and horizontally as well. By default, the Model Optimizer converts topologies with `keep_aspect_ratio_resizer` to consume a square input image. If the non-square image is provided as input, it is stretched without keeping aspect ratio that results to objects detection quality decrease. +Models with `keep_aspect_ratio_resizer` were trained to recognize objects in their real aspect ratio, in contrast with most of the classification topologies, which are trained to recognize objects stretched vertically and horizontally as well. By default, the Model Optimizer converts topologies with `keep_aspect_ratio_resizer` to consume a square input image. If a non-square image is provided as input, it is stretched without keeping the aspect ratio, which results in a decrease of object detection quality. > **NOTE**: It is highly recommended specifying the `--input_shape` command line parameter for the models with `keep_aspect_ratio_resizer` if the input image dimensions are known in advance. -## Important Notes About Feeding Input Images to the Samples - -Inference Engine comes with a number of samples that use Object Detection API models including: - -* [Object Detection for SSD Sample](../../../../../inference-engine/samples/object_detection_sample_ssd/README.md) --- for RFCN, SSD and Faster R-CNNs -* [Mask R-CNN Sample for TensorFlow* Object Detection API Models](@ref omz_demos_mask_rcnn_demo_cpp) --- for Mask R-CNNs - -There are a number of important notes about feeding input images to the samples: - -1. Inference Engine samples stretch input image to the size of the input layer without preserving aspect ratio.
This behavior is usually correct for most topologies (including SSDs), but incorrect for the following Faster R-CNN topologies: Inception ResNet, Inception V2, ResNet50 and ResNet101. Images pre-processing for these topologies keeps aspect ratio. Also all Mask R-CNN and R-FCN topologies require keeping aspect ratio. The type of pre-processing is defined in the pipeline configuration file in the section `image_resizer`. If keeping aspect ratio is required, then it is necessary to resize image before passing it to the sample. - -2. TensorFlow\* implementation of image resize may be different from the one implemented in the sample. Even reading input image from compressed format (like `.jpg`) could give different results in the sample and TensorFlow\*. So, if it is necessary to compare accuracy between the TensorFlow\* and the Inference Engine it is recommended to pass pre-scaled input image in a non-compressed format (like `.bmp`). - -3. If you want to infer the model with the Inference Engine samples, convert the model specifying the `--reverse_input_channels` command line parameter. The samples load images in BGR channels order, while TensorFlow* models were trained with images in RGB order. When the `--reverse_input_channels` command line parameter is specified, the Model Optimizer performs first convolution or other channel dependent operation weights modification so the output will be like the image is passed with RGB channels order. - - ## Detailed Explanations of Model Conversion Process This section is intended for users who want to understand how the Model Optimizer performs Object Detection API models conversion in details. The knowledge given in this section is also useful for users having complex models that are not converted with the Model Optimizer out of the box. It is highly recommended to read [Sub-Graph Replacement in Model Optimizer](../../customize_model_optimizer/Subgraph_Replacement_Model_Optimizer.md) chapter first to understand sub-graph replacement concepts which are used here. -Implementation of the sub-graph replacers for Object Detection API models is located in the file `/deployment_tools/model_optimizer/extensions/front/tf/ObjectDetectionAPI.py`. - It is also important to open the model in the [TensorBoard](https://www.tensorflow.org/guide/summaries_and_tensorboard) to see the topology structure. Model Optimizer can create an event file that can be then fed to the TensorBoard* tool. Run the Model Optimizer with providing two command line parameters: * `--input_model ` --- Path to the frozen model * `--tensorboard_logdir` --- Path to the directory where TensorBoard looks for the event files. -### SSD (Single Shot Multibox Detector) Topologies - -The SSD topologies are the simplest ones among Object Detection API topologies, so they will be analyzed first. The sub-graph replacement configuration file `ssd_v2_support.json`, which should be used to convert these models, contains three sub-graph replacements: `ObjectDetectionAPIPreprocessorReplacement`, `ObjectDetectionAPISSDPostprocessorReplacement` and `ObjectDetectionAPIOutputReplacement`. Their implementation is described below. - -#### Preprocessor Block - -All Object Detection API topologies contain `Preprocessor` block of nodes (aka ["scope"](https://www.tensorflow.org/guide/graph_viz)) that performs two tasks: - -* Scales image to the size required by the topology. -* Applies mean and scale values if needed. 
- -Model Optimizer cannot convert the part of the `Preprocessor` block performing scaling because the TensorFlow implementation uses `while`- loops which the Inference Engine does not support. Another reason is that the Inference Engine samples scale input images to the size of the input layer from the Intermediate Representation (IR) automatically. Given that it is necessary to cut-off the scaling part of the `Preprocessor` block and leave only operations applying mean and scale values. This task is solved using the Model Optimizer [sub-graph replacer mechanism](../../customize_model_optimizer/Subgraph_Replacement_Model_Optimizer.md). - -The `Preprocessor` block has two outputs: the tensor with pre-processed image(s) data and a tensor with pre-processed image(s) size(s). While converting the model, Model Optimizer keeps only the nodes producing the first tensor. The second tensor is a constant which can be obtained from the `pipeline.config` file to be used in other replacers. - -The implementation of the `Preprocessor` block sub-graph replacer is the following (file `/deployment_tools/model_optimizer/extensions/front/tf/ObjectDetectionAPI.py`): - -```python -class ObjectDetectionAPIPreprocessorReplacement(FrontReplacementFromConfigFileSubGraph): - """ - The class replaces the "Preprocessor" block resizing input image and applying mean/scale values. Only nodes related - to applying mean/scaling values are kept. - """ - replacement_id = 'ObjectDetectionAPIPreprocessorReplacement' - - def run_before(self): - return [Pack, Sub] - - def nodes_to_remove(self, graph: Graph, match: SubgraphMatch): - new_nodes_to_remove = match.matched_nodes_names() - # do not remove nodes that perform input image scaling and mean value subtraction - for node_to_keep in ('Preprocessor/sub', 'Preprocessor/sub/y', 'Preprocessor/mul', 'Preprocessor/mul/x'): - if node_to_keep in new_nodes_to_remove: - new_nodes_to_remove.remove(node_to_keep) - return new_nodes_to_remove - - def generate_sub_graph(self, graph: Graph, match: SubgraphMatch): - argv = graph.graph['cmd_params'] - layout = graph.graph['layout'] - if argv.tensorflow_object_detection_api_pipeline_config is None: - raise Error(missing_param_error) - pipeline_config = PipelineConfig(argv.tensorflow_object_detection_api_pipeline_config) - - sub_node = match.output_node(0)[0] - if not sub_node.has('op') or sub_node.op != 'Sub': - raise Error('The output op of the Preprocessor sub-graph is not of type "Sub". Looks like the topology is ' - 'not created with TensorFlow Object Detection API.') - - mul_node = None - if sub_node.in_node(0).has('op') and sub_node.in_node(0).op == 'Mul': - log.info('There is image scaling node in the Preprocessor block.') - mul_node = sub_node.in_node(0) - - initial_input_node_name = 'image_tensor' - if initial_input_node_name not in graph.nodes(): - raise Error('Input node "{}" of the graph is not found. 
Do not run the Model Optimizer with ' - '"--input" command line parameter.'.format(initial_input_node_name)) - placeholder_node = Node(graph, initial_input_node_name) - - # set default value of the batch size to 1 if user didn't specify batch size and input shape - batch_dim = get_batch_dim(layout, 4) - if argv.batch is None and placeholder_node.shape[batch_dim] == -1: - placeholder_node.shape[batch_dim] = 1 - if placeholder_node.shape[batch_dim] > 1: - print("[ WARNING ] The batch size more than 1 is supported for SSD topologies only.") - height, width = calculate_placeholder_spatial_shape(graph, match, pipeline_config) - placeholder_node.shape[get_height_dim(layout, 4)] = height - placeholder_node.shape[get_width_dim(layout, 4)] = width - - # save the pre-processed image spatial sizes to be used in the other replacers - graph.graph['preprocessed_image_height'] = placeholder_node.shape[get_height_dim(layout, 4)] - graph.graph['preprocessed_image_width'] = placeholder_node.shape[get_width_dim(layout, 4)] - - to_float_node = placeholder_node.out_node(0) - if not to_float_node.has('op') or to_float_node.op != 'Cast': - raise Error('The output of the node "{}" is not Cast operation. Cannot apply replacer.'.format( - initial_input_node_name)) - - # connect to_float_node directly with node performing scale on mean value subtraction - if mul_node is None: - create_edge(to_float_node, sub_node, 0, 0) - else: - create_edge(to_float_node, mul_node, 0, 1) - - print('The Preprocessor block has been removed. Only nodes performing mean value subtraction and scaling (if' - ' applicable) are kept.') - return {} -``` -The `run_before` function defines a list of replacers which current replacer should be run before. In this case it is `Pack` and `Sub`. The `Sub` operation is not supported by Inference Engine plugins so Model Optimizer replaces it with a combination of the `Eltwise` layer (element-wise sum) and the `ScaleShift` layer. But the `Preprocessor` replacer expects to see `Sub` node, so it should be called before the `Sub` is replaced. - -The `nodes_to_remove` function returns list of nodes that should be removed after the replacement happens. In this case it removes all nodes matched in the `Preprocessor` scope except the `Sub` and `Mul` nodes performing mean value subtraction and scaling. - -The `generate_sub_graph` function performs the following actions: - -* Lines 20-24: Reads the `pipeline.config` configuration file to get the model hyper-parameters and other attributes. -* Lines 25-29: Checks that the output node of the `Preprocessor` scope is of type `Sub`. -* Lines 31-34: Checks that the input of the `Sub` node is of type `Mul`. This information is needed to correctly connect the input node of the topology later. -* Lines 36-50: Finds the topology input (placeholder) node and sets its weight and height according to the image resizer defined in the `pipeline.config` file and the `--input_shape` provided by the user. The batch size is set to 1 by default, but it will be overridden if you specify a batch size using command-line option `-b`. Refer to the [Custom Input Shape](#tf_od_custom_input_shape) on how the Model Optimizer calculates input layer height and width. -* Lines 52-54: Saves the placeholder shape in the `graph` object for other sub-graph replacements. -* Lines 56-59: Checks that the placeholder node follows the 'Cast' node which converts model input data from UINT8 to FP32. 
-* Lines 61-65: Creates edge from the placeholder node to the `Mul` (if present) or `Sub` node to a correct input port (0 for `Sub` and 1 for `Mul`). -* Line 69: The replacer returns a dictionary with nodes mapping that is used by other sub-graph replacement functions. In this case, it is not needed, so the empty dictionary is returned. - -#### Postprocessor Block - -A distinct feature of any SSD topology is a part performing non-maximum suppression of proposed images bounding boxes. This part of the topology is implemented with dozens of primitive operations in TensorFlow, while in Inference Engine, it is one [layer](../../../../ops/opset.md) called `DetectionOutput`. Thus, to convert a SSD model from the TensorFlow, the Model Optimizer should replace the entire sub-graph of operations that implement the `DetectionOutput` layer with a single `DetectionOutput` node. - -The Inference Engine `DetectionOutput` layer implementation consumes three tensors in the following order: - -1. Tensor with locations of bounding boxes -2. Tensor with confidences for each bounding box -3. Tensor with prior boxes ("anchors" in a TensorFlow terminology) - -The Inference Engine `DetectionOutput` layer implementation produces one tensor with seven numbers for each actual detection: - -* batch index -* class label -* class probability -* x_1 box coordinate -* y_1 box coordinate -* x_2 box coordinate -* y_2 box coordinate. - -There are more output tensors in the TensorFlow Object Detection API: "detection_boxes", "detection_classes", "detection_scores" and "num_detections", but the values in them are consistent with the output values of the Inference Engine DetectionOutput layer. - -The sub-graph replacement by points is used in the `ssd_v2_support.json` to match the `Postprocessor` block. The start points are defined the following way: - -* "Postprocessor/Shape" receives tensor with bounding boxes; -* "Postprocessor/scale_logits" receives tensor with confidences(probabilities) for each box; -* "Postprocessor/Tile" receives tensor with prior boxes (anchors); -* "Postprocessor/Reshape_1" is specified only to match the whole `Postprocessor` scope. Not used in the replacement code; -* "Postprocessor/ToFloat" is specified only to match the whole `Postprocessor` scope. Not used in the replacement code. - -There are a number of differences in layout, format and content of in input tensors to `DetectionOutput` layer and what tensors generates TensorFlow, so additional tensors processing before creating `DetectionOutput` layer is required. It is described below. 
The sub-graph replacement class for the `DetectionOutput` layer is given below: - -```python -class ObjectDetectionAPISSDPostprocessorReplacement(FrontReplacementFromConfigFileSubGraph): - replacement_id = 'ObjectDetectionAPISSDPostprocessorReplacement' - - def run_after(self): - return [ObjectDetectionAPIPreprocessorReplacement] - - def run_before(self): - # the replacer uses node of type "RealDiv" as one of the start points, but Model Optimizer replaces nodes of - # type "RealDiv" with a new ones, so it is necessary to replace the sub-graph before replacing the "RealDiv" - # nodes - return [Div, StandaloneConstEraser] - - def output_edges_match(self, graph: Graph, match: SubgraphMatch, new_sub_graph: dict): - # the DetectionOutput in IE produces single tensor, but in TF it produces two tensors, so create only one output - # edge match - return {match.output_node(0)[0].id: new_sub_graph['detection_output_node'].id} - - def generate_sub_graph(self, graph: Graph, match: SubgraphMatch): - argv = graph.graph['cmd_params'] - if argv.tensorflow_object_detection_api_pipeline_config is None: - raise Error(missing_param_error) - pipeline_config = PipelineConfig(argv.tensorflow_object_detection_api_pipeline_config) - num_classes = _value_or_raise(match, pipeline_config, 'num_classes') - - # reshapes confidences to 4D before applying activation function - expand_dims_op = Reshape(graph, {'dim': int64_array([0, 1, -1, num_classes + 1])}) - # do not convert from NHWC to NCHW this node shape - expand_dims_node = expand_dims_op.create_node([match.input_nodes(1)[0][0].in_node(0)], - dict(name='do_ExpandDims_conf')) - - activation_function = _value_or_raise(match, pipeline_config, 'postprocessing_score_converter') - activation_conf_node = add_activation_function_after_node(graph, expand_dims_node, activation_function) - PermuteAttrs.set_permutation(expand_dims_node, expand_dims_node.out_node(), None) - - # IE DetectionOutput layer consumes flattened tensors - # reshape operation to flatten locations tensor - reshape_loc_op = Reshape(graph, {'dim': int64_array([0, -1])}) - reshape_loc_node = reshape_loc_op.create_node([match.input_nodes(0)[0][0].in_node(0)], - dict(name='do_reshape_loc')) - - # IE DetectionOutput layer consumes flattened tensors - # reshape operation to flatten confidence tensor - reshape_conf_op = Reshape(graph, {'dim': int64_array([0, -1])}) - reshape_conf_node = reshape_conf_op.create_node([activation_conf_node], dict(name='do_reshape_conf')) - - if pipeline_config.get_param('ssd_anchor_generator_num_layers') is not None or \ - pipeline_config.get_param('multiscale_anchor_generator_min_level') is not None: - # change the Reshape operations with hardcoded number of output elements of the convolution nodes to be - # reshapable - _relax_reshape_nodes(graph, pipeline_config) - - # create PriorBoxClustered nodes instead of a constant value with prior boxes so the model could be reshaped - if pipeline_config.get_param('ssd_anchor_generator_num_layers') is not None: - priors_node = _create_prior_boxes_node(graph, pipeline_config) - elif pipeline_config.get_param('multiscale_anchor_generator_min_level') is not None: - priors_node = _create_multiscale_prior_boxes_node(graph, pipeline_config) - else: - log.info('The anchor generator is not known. 
Save constant with prior-boxes to IR.') - priors_node = match.input_nodes(2)[0][0].in_node(0) - - # creates DetectionOutput Node object from Op class - detection_output_op = DetectionOutput(graph, match.custom_replacement_desc.custom_attributes) - detection_output_op.attrs['old_infer'] = detection_output_op.attrs['infer'] - detection_output_op.attrs['infer'] = __class__.do_infer - detection_output_node = detection_output_op.create_node( - [reshape_loc_node, reshape_conf_node, priors_node], - dict(name=detection_output_op.attrs['type'], - clip=1, - confidence_threshold=_value_or_raise(match, pipeline_config, 'postprocessing_score_threshold'), - top_k=_value_or_raise(match, pipeline_config, 'postprocessing_max_detections_per_class'), - keep_top_k=_value_or_raise(match, pipeline_config, 'postprocessing_max_total_detections'), - nms_threshold=_value_or_raise(match, pipeline_config, 'postprocessing_iou_threshold'))) - - return {'detection_output_node': detection_output_node} -``` - -The `run_before` and `run_after` functions define lists of replacers that this replacer should be run before and after respectively. - -The `input_edges_match` and `output_edges_match` functions generate dictionaries describing how the input/output nodes matched with the replacer should be connected with new nodes generated in the `generate_sub_graph` function. Refer to [sub-graph replacements](../../customize_model_optimizer/Subgraph_Replacement_Model_Optimizer.md) documentation for more information. - -The `generate_sub_graph` function performs the following actions: - -* Lines 19-23: Reads the `pipeline.config` configuration file to get the model hyper-parameters and other attributes. -* Lines 25-32: Makes tensor with confidences 4D and apply correct activation function (read from the `pipeline.config` file) to it. -* Line 33: Disables permutation of `expand_dims_node`'s attributes because they are already in the NCHW layout. -* Lines 35-39: Makes tensor with bounding boxes 2D, where the first dimension corresponds to a batch size. -* Lines 49-52: Makes tensor with confidences 2D, where the first dimension corresponds to a batch size. -* Lines 41-44: Creates a node with `DetectionOutput` layer with a number of layer attributes from the `pipeline.config` file. Also the inference function (`infer` attribute) is updated with a custom inference function `__class__.do_infer`. The latter change is described below. -* Lines 46-59: Creates several `PriorBoxClustered` layers which generate prior boxes depending on the type of the grid anchor generator defined in the `pipeline.config` file. If the grid anchor type is not known then initialize `priors_node` as a node matched by the sub-graph replacement. In the latter case it is a constant node with prior boxes calculated for a particular input image shape. -* Lines 61-72: Creates `DetectionOutput` layer with attributes from the `pipeline.config` file. -* Line 74: Returns dictionary with mapping of nodes that is used in the `input_edges_match` and `output_edges_match` functions. - -The paragraphs below explains why the inference function for the Detection Output layer is modified. Before doing that it is necessary to make acquaintance with selected high-level steps of the Model Optimize model conversion pipeline. Note, that only selected steps are required for understanding the change are mentioned: - -1. Model Optimizer creates calculation graph from the initial topology where each nodes corresponds to a operation from the initial model. -2. 
Model Optimizer performs "Front replacers" (including the one being described now). -3. Model Optimizer adds data nodes between operation nodes to the graph. -4. Model Optimizer performs "Middle replacers". -5. Model Optimizer performs "shape inference" phase. During this phase the shape of all data nodes is being calculated. Model Optimizer also calculates value for data tensors which are constant, i.e. do not depend on input. For example, tensor with prior boxes (generated with `MultipleGridAnchorGenerator` or similar scopes) doesn't depend on input and is evaluated by Model Optimizer during shape inference. Model Optimizer uses inference function stored in the 'infer' attribute of operation nodes. -6. Model Optimizer performs "Back replacers". -7. Model Optimizer generates IR. - -The `do_infer` function is needed to perform some adjustments to the tensor with prior boxes (anchors) that is known only after the shape inference phase and to perform additional transformations described below. This change is performed only if the tensor with prior boxes is not constant (so it is produced by `PriorBoxClustered` layers during inference). It is possible to make the `Postprocessor` block replacement as a Middle replacer (so the prior boxes tensor would be evaluated by the time the replacer is called), but in this case it will be necessary to correctly handle data nodes which are created between each pair of initially adjacent operation nodes. In order to inject required modification to the inference function of the `DetectionOutput` node, a new function is created to perform modifications and to call the initial inference function. The code of a new inference function is the following: - -```python -@staticmethod -def do_infer(node: Node): - prior_boxes = node.in_node(2).value - if prior_boxes is not None: - argv = node.graph.graph['cmd_params'] - if argv.tensorflow_object_detection_api_pipeline_config is None: - raise Error(missing_param_error) - pipeline_config = PipelineConfig(argv.tensorflow_object_detection_api_pipeline_config) - variance = _variance_from_pipeline_config(pipeline_config) - # replicating the variance values for all prior-boxes - variances = np.tile(variance, [prior_boxes.shape[-2], 1]) - # DetectionOutput Inference Engine expects the prior-boxes in the following layout: (values, variances) - prior_boxes = prior_boxes.reshape([-1, 4]) - prior_boxes = np.concatenate((prior_boxes, variances), 0) - # compared to the IE's DetectionOutput, the TF keeps the prior-boxes in YXYX, need to get back to the XYXY - prior_boxes = np.concatenate((prior_boxes[:, 1:2], prior_boxes[:, 0:1], - prior_boxes[:, 3:4], prior_boxes[:, 2:3]), 1) - # adding another dimensions, as the prior-boxes are expected as 3d tensors - prior_boxes = prior_boxes.reshape((1, 2, -1)) - node.in_node(2).shape = int64_array(prior_boxes.shape) - node.in_node(2).value = prior_boxes - - node.old_infer(node) - # compared to the IE's DetectionOutput, the TF keeps the locations in YXYX, need to get back to the XYXY - # for last convolutions that operate the locations need to swap the X and Y for output feature weights & biases - conv_nodes = backward_bfs_for_operation(node.in_node(0), ['Conv2D']) - swap_weights_xy(conv_nodes) - squeeze_reshape_and_concat(conv_nodes) - - for node_name in node.graph.nodes(): - node = Node(node.graph, node_name) - if node.has_and_set('swap_xy_count') and len(node.out_nodes()) != node['swap_xy_count']: - raise Error('The weights were swapped for node "{}", but this weight was used in other 
nodes.'.format( - node.name)) -``` - -* Lines 3-18: Updates the value of the tensor with prior boxes by appending variance values if the prior boxes are pre-calculated. Inference Engine implementation of the `DetectionOutput` layer expects these values located within the tensor with bounding boxes, but in TensorFlow they are applied in different way. -* Line 23: Executes initial inference function to calculate the output shape of this node. -* Lines 26-27: Finds predecessor node of type "Conv2D" of the node with bounding boxes (which is `node.in_node(0)`) and modifies convolution weights so "X" and "Y" coordinates are swapped. In TensorFlow bounding boxes are stored in the tensors in "YXYX" order, while in the Inference Engine it is "XYXY". -* Line 28: Executes function looking for `Reshape` operations after the `Conv2D` nodes found above with 4D output and remove the dimension with index 2 which should be equal to 1. This is a workaround to make tensor 3D so its shape will not be transposed during the IR generation. The problem arises when bounding boxes predictions are reshaped from [1, 1, 1, X] to [1, X / 4, 1, 4]. The result tensor should not be transposed because after transpose it will have shape [1, 4, X / 4, 1] and the concatenation over dimension with index 2 will produce incorrect tensor. Also the function looks for `Concat` operations and changes the concatenation dimension from 2 to 1. - -### Faster R-CNN Topologies -The Faster R-CNN models contain several building blocks similar to building blocks from SSD models so it is highly recommended to read the section about converting them first. Detailed information about Faster R-CNN topologies is provided [in the abstract](https://arxiv.org/abs/1506.01497). - -#### Preprocessor Block -Faster R-CNN topologies contain similar `Preprocessor` block as SSD topologies. The same `ObjectDetectionAPIPreprocessorReplacement` sub-graph replacer is used to cut it off. - -#### Proposal Layer -The `Proposal` layer is implemented with dozens of primitive operations in TensorFlow, meanwhile, it is a single layer in the Inference Engine. The `ObjectDetectionAPIProposalReplacement` sub-graph replacer identifies nodes corresponding to the layer and replaces them with required new nodes. - -```python -class ObjectDetectionAPIProposalReplacement(FrontReplacementFromConfigFileSubGraph): - """ - This class replaces sub-graph of operations with Proposal layer and additional layers transforming - tensors from layout of TensorFlow to layout required by Inference Engine. - Refer to comments inside the function for more information about performed actions. 
- """ - replacement_id = 'ObjectDetectionAPIProposalReplacement' - - def run_after(self): - return [ObjectDetectionAPIPreprocessorReplacement] - - def run_before(self): - return [Sub, CropAndResizeReplacement] - - def output_edges_match(self, graph: Graph, match: SubgraphMatch, new_sub_graph: dict): - return {match.output_node(0)[0].id: new_sub_graph['proposal_node'].id} - - def nodes_to_remove(self, graph: Graph, match: SubgraphMatch): - new_list = match.matched_nodes_names().copy() - # do not remove nodes that produce box predictions and class predictions - new_list.remove(match.single_input_node(0)[0].id) - new_list.remove(match.single_input_node(1)[0].id) - return new_list - - def generate_sub_graph(self, graph: Graph, match: SubgraphMatch): - argv = graph.graph['cmd_params'] - if argv.tensorflow_object_detection_api_pipeline_config is None: - raise Error(missing_param_error) - pipeline_config = PipelineConfig(argv.tensorflow_object_detection_api_pipeline_config) - - max_proposals = _value_or_raise(match, pipeline_config, 'first_stage_max_proposals') - proposal_ratios = _value_or_raise(match, pipeline_config, 'anchor_generator_aspect_ratios') - proposal_scales = _value_or_raise(match, pipeline_config, 'anchor_generator_scales') - anchors_count = len(proposal_ratios) * len(proposal_scales) - - # Convolution/matmul node that produces classes predictions - # Permute result of the tensor with classes permissions so it will be in a correct layout for Softmax - predictions_node = backward_bfs_for_operation(match.single_input_node(1)[0], ['Add'])[0] - - reshape_classes_op = Reshape(graph, dict(dim=int64_array([0, anchors_count, 2, -1]))) - reshape_classes_node = reshape_classes_op.create_node([], dict(name='predictions/Reshape', nchw_layout=True)) - predictions_node.insert_node_after(reshape_classes_node, 0) - - softmax_conf_op = Softmax(graph, dict(axis=2, nchw_layout=True, name=reshape_classes_node.id + '/Softmax')) - softmax_conf_node = softmax_conf_op.create_node([reshape_classes_node]) - permute_reshape_softmax_op = Permute(graph, dict(order=int64_array([0, 2, 1, 3]), nchw_layout=True)) - permute_reshape_softmax_node = permute_reshape_softmax_op.create_node([softmax_conf_node], dict( - name=softmax_conf_node.name + '/Permute')) - - initial_shape_op = Shape(graph, dict(name=predictions_node.id + '/Shape')) - initial_shape_node = initial_shape_op.create_node([predictions_node]) - - # implement custom reshape infer function because we need to know the input convolution node output dimension - # sizes but we can know it only after partial infer - reshape_permute_op = Reshape(graph, dict()) - reshape_permute_node = reshape_permute_op.create_node([permute_reshape_softmax_node, initial_shape_node], - dict(name='Reshape_Permute_Class')) - - variance_height = pipeline_config.get_param('frcnn_variance_height') - variance_width = pipeline_config.get_param('frcnn_variance_width') - variance_x = pipeline_config.get_param('frcnn_variance_x') - variance_y = pipeline_config.get_param('frcnn_variance_y') - anchor_generator_height_stride = pipeline_config.get_param('anchor_generator_height_stride') - anchor_generator_width_stride = pipeline_config.get_param('anchor_generator_width_stride') - anchor_generator_height = pipeline_config.get_param('anchor_generator_height') - anchor_generator_width = pipeline_config.get_param('anchor_generator_width') - - if variance_height != variance_width: - log.error('The values for variance for height "{}" is not equal to variance for width "{}". 
The detection ' - 'results will be inaccurate.'.format(variance_height, variance_width)) - if variance_x != variance_y: - log.error('The values for variance for x "{}" is not equal to variance for y "{}". The detection ' - 'results will be inaccurate.'.format(variance_x, variance_y)) - if anchor_generator_height_stride != anchor_generator_width_stride: - log.error('The values for the anchor generator height stride "{}" is not equal to the anchor generator ' - 'width stride "{}". The detection results will be inaccurate.'.format( - anchor_generator_height_stride, anchor_generator_width_stride)) - if anchor_generator_height != anchor_generator_width: - log.error('The values for the anchor generator height "{}" is not equal to the anchor generator width ' - 'stride "{}". The detection results will be inaccurate.'.format(anchor_generator_height, - anchor_generator_width)) - - proposal_op = ProposalOp(graph, dict(min_size=1, - framework='tensorflow', - pre_nms_topn=2 ** 31 - 1, - box_size_scale=variance_height, - box_coordinate_scale=variance_x, - post_nms_topn=max_proposals, - feat_stride=anchor_generator_height_stride, - ratio=proposal_ratios, - scale=proposal_scales, - normalize=1, - base_size=anchor_generator_height, - nms_thresh=_value_or_raise(match, pipeline_config, - 'first_stage_nms_iou_threshold'))) - for key in ('clip_before_nms', 'clip_after_nms'): - if key in match.custom_replacement_desc.custom_attributes: - proposal_op.attrs[key] = int(match.custom_replacement_desc.custom_attributes[key]) - - anchors_node = backward_bfs_for_operation(match.single_input_node(0)[0], ['Add'])[0] - - # creates input to store input image height, width and scales (usually 1.0s) - # the batch size for this input is fixed because it is allowed to pass images of the same size only as input - input_op_with_image_size = Input(graph, dict(shape=int64_array([1, 3]), fixed_batch=True)) - input_with_image_size_node = input_op_with_image_size.create_node([], dict(name='image_info')) - - proposal_node = proposal_op.create_node([reshape_permute_node, anchors_node, input_with_image_size_node], - dict(name='proposals')) - - if 'do_not_swap_proposals' in match.custom_replacement_desc.custom_attributes and \ - match.custom_replacement_desc.custom_attributes['do_not_swap_proposals']: - swapped_proposals_node = proposal_node - else: - swapped_proposals_node = add_convolution_to_swap_xy_coordinates(graph, proposal_node, 5) - - proposal_reshape_2d_op = Reshape(graph, dict(dim=int64_array([-1, 5]), nchw_layout=True)) - proposal_reshape_2d_node = proposal_reshape_2d_op.create_node([swapped_proposals_node], - dict(name="reshape_swap_proposals_2d")) - - # feed the CropAndResize node with a correct boxes information produced with the Proposal layer - # find the first CropAndResize node in the BFS order - crop_and_resize_nodes_ids = [node_id for node_id in bfs_search(graph, [match.single_input_node(0)[0].id]) if - graph.node[node_id]['op'] == 'CropAndResize'] - assert len(crop_and_resize_nodes_ids) != 0, "Didn't find any CropAndResize nodes in the graph." 
- if 'do_not_swap_proposals' not in match.custom_replacement_desc.custom_attributes or not \ - match.custom_replacement_desc.custom_attributes['do_not_swap_proposals']: - crop_and_resize_node = Node(graph, crop_and_resize_nodes_ids[0]) - # set a marker that the input with box coordinates has been pre-processed so the CropAndResizeReplacement - # transform doesn't try to merge the second and the third inputs - crop_and_resize_node['inputs_preprocessed'] = True - graph.remove_edge(crop_and_resize_node.in_node(1).id, crop_and_resize_node.id) - graph.create_edge(proposal_reshape_2d_node, crop_and_resize_node, out_port=0, in_port=1) - - tf_proposal_reshape_4d_op = Reshape(graph, dict(dim=int64_array([-1, 1, max_proposals, 5]), nchw_layout=True)) - tf_proposal_reshape_4d_node = tf_proposal_reshape_4d_op.create_node([swapped_proposals_node], - dict(name="reshape_proposal_4d")) - - crop_op = Crop(graph, dict(axis=int64_array([3]), offset=int64_array([1]), dim=int64_array([4]), - nchw_layout=True)) - crop_node = crop_op.create_node([tf_proposal_reshape_4d_node], dict(name='crop_proposals')) - - tf_proposals_crop_reshape_3d_op = Reshape(graph, dict(dim=int64_array([0, -1, 4]), nchw_layout=True)) - tf_proposals_crop_reshape_3d_node = tf_proposals_crop_reshape_3d_op.create_node([crop_node], - dict(name="reshape_crop_3d")) - - return {'proposal_node': tf_proposals_crop_reshape_3d_node} -``` -The main interest of the implementation of this replacer is the `generate_sub_graph` function. - -Lines 26-34: Parses the `pipeline.config` file and gets required parameters for the `Proposal` layer. - -Lines 38-57: Performs the following manipulations with the tensor with class predictions. TensorFlow uses the NHWC layout, while the Inference Engine uses NCHW. Model Optimizer by default performs transformations with all nodes data in the inference graph to convert it to the NCHW layout. The size of 'C' dimension of the tensor with class predictions is equal to \f$base\_anchors\_count \cdot 2\f$, where 2 corresponds to a number of classes (background and foreground) and \f$base\_anchors\_count\f$ is equal to number of anchors that are applied to each position of 'H' and 'W' dimensions. Therefore, there are \f$H \cdot W \cdot base\_anchors\_count\f$ bounding boxes. Lines 44-45 apply the Softmax layer to this tensor to get class probabilities for each bounding box. - -Lines 59-81: Reads topology parameters related to variances and anchors generation. - -Lines 83-108: Adds the `Proposal` layer to the graph. This layer has one input (generated in lines 104-105) which should be filled with three values before inference: input image height, input image width, image scale factor. - -Lines 110-132: Swaps output values of the `Proposal` layer if the parameter `do_not_swap_proposals` is not set to `True` in the sub-graph replacement configuration file for the replacer. - -Lines 134-144: Crops the output from the `Proposal` node to remove the batch indices (the Inference Engine implementation of the `Proposal` layer generates tensor with shape `[num_proposals, 5]`). The final tensor contains just box coordinates as in the TensorFlow implementation. - -#### SecondStagePostprocessor Block -The `SecondStagePostprocessor` block is similar to the `Postprocessor` block from the SSDs topologies. But there are a number of differences in conversion of the `SecondStagePostprocessor` block. 
- -```python -class ObjectDetectionAPIDetectionOutputReplacement(FrontReplacementFromConfigFileSubGraph): - """ - Replaces the sub-graph that is equal to the DetectionOutput layer from Inference Engine. This replacer is used for - Faster R-CNN, R-FCN and Mask R-CNN topologies conversion. - The replacer uses a value of the custom attribute 'coordinates_swap_method' from the sub-graph replacement - configuration file to choose how to swap box coordinates of the 0-th input of the generated DetectionOutput layer. - Refer to the code for more details. - """ - replacement_id = 'ObjectDetectionAPIDetectionOutputReplacement' - - def run_before(self): - return [ObjectDetectionAPIMaskRCNNROIPoolingSecondReplacement, Unpack, Sub] - - def run_after(self): - return [ObjectDetectionAPIProposalReplacement, CropAndResizeReplacement] - - def nodes_to_remove(self, graph: Graph, match: SubgraphMatch): - new_nodes_to_remove = match.matched_nodes_names().copy() - outputs = ['detection_boxes', 'detection_scores', 'num_detections'] - for output in outputs: - children = Node(graph, output).out_nodes() - if len(children) != 1: - log.warning('Output {} has {} children. It should have only one output: with op==`OpOutput`' - ''.format(output, len(children))) - elif children[list(children.keys())[0]].op == 'OpOutput': - new_nodes_to_remove.append(children[list(children.keys())[0]].id) - else: - continue - new_nodes_to_remove.extend(outputs) - return new_nodes_to_remove - - def output_edges_match(self, graph: Graph, match: SubgraphMatch, new_sub_graph: dict): - # the DetectionOutput in IE produces single tensor, but in TF it produces four tensors, so we need to create - # only one output edge match - return {match.output_node(0)[0].id: new_sub_graph['detection_output_node'].id} - - @staticmethod - def skip_nodes_by_condition(current_node: Node, condition: callable): - while condition(current_node): - current_node = current_node.in_node() - return current_node - - def generate_sub_graph(self, graph: Graph, match: SubgraphMatch): - argv = graph.graph['cmd_params'] - if argv.tensorflow_object_detection_api_pipeline_config is None: - raise Error(missing_param_error) - pipeline_config = PipelineConfig(argv.tensorflow_object_detection_api_pipeline_config) - - num_classes = _value_or_raise(match, pipeline_config, 'num_classes') - max_proposals = _value_or_raise(match, pipeline_config, 'first_stage_max_proposals') - activation_function = _value_or_raise(match, pipeline_config, 'postprocessing_score_converter') - - activation_conf_node = add_activation_function_after_node(graph, match.single_input_node(1)[0].in_node(0), - activation_function) - - # IE DetectionOutput layer consumes flattened tensors so need add a Reshape layer. - # The batch value of the input tensor is not equal to the batch of the topology, so it is not possible to use - # "0" value in the Reshape layer attribute to refer to the batch size, but we know how to - # calculate the second dimension so the batch value will be deduced from it with help of "-1". - reshape_conf_op = Reshape(graph, dict(dim=int64_array([-1, (num_classes + 1) * max_proposals]))) - reshape_conf_node = reshape_conf_op.create_node([activation_conf_node], dict(name='do_reshape_conf')) - - # Workaround for PermuteForReshape pass. - # We looking for first not Reshape-typed node before match.single_input_node(0)[0].in_node(0). - # And add reshape_loc node after this first not Reshape-typed node. 
- current_node = self.skip_nodes_by_condition(match.single_input_node(0)[0].in_node(0), - lambda x: x['kind'] == 'op' and x.soft_get('type') == 'Reshape') - - reshape_loc_op = Reshape(graph, dict(dim=int64_array([-1, num_classes, 1, 4]))) - reshape_loc_node = reshape_loc_op.create_node([current_node], dict(name='reshape_loc', nchw_layout=True)) - update_attrs(reshape_loc_node, 'shape_attrs', 'dim') - - # constant node with variances - variances_const_op = Const(graph, dict(value=_variance_from_pipeline_config(pipeline_config))) - variances_const_node = variances_const_op.create_node([]) - - # TF produces locations tensor without boxes for background. - # Inference Engine DetectionOutput layer requires background boxes so we generate them - loc_node = add_fake_background_loc(graph, reshape_loc_node) - PermuteAttrs.set_permutation(reshape_loc_node, loc_node, None) - - # reshape locations tensor to 2D so it could be passed to Eltwise which will be converted to ScaleShift - reshape_loc_2d_op = Reshape(graph, dict(dim=int64_array([-1, 4]))) - reshape_loc_2d_node = reshape_loc_2d_op.create_node([loc_node], dict(name='reshape_locs_2d', nchw_layout=True)) - PermuteAttrs.set_permutation(loc_node, reshape_loc_2d_node, None) - - # element-wise multiply locations with variances - eltwise_locs_op = Eltwise(graph, dict(operation='mul')) - eltwise_locs_node = eltwise_locs_op.create_node([reshape_loc_2d_node, variances_const_node], - dict(name='scale_locs')) - - # IE DetectionOutput layer consumes flattened tensors so need add a Reshape layer. - # The batch value of the input tensor is not equal to the batch of the topology, so it is not possible to use - # "0" value in the Reshape layer attribute to refer to the batch size, but we know how to - # calculate the second dimension so the batch value will be deduced from it with help of "-1". - reshape_loc_do_op = Reshape(graph, dict(dim=int64_array([-1, (num_classes + 1) * max_proposals * 4]))) - - custom_attributes = match.custom_replacement_desc.custom_attributes - coordinates_swap_method = 'add_convolution' - if 'coordinates_swap_method' not in custom_attributes: - log.error('The ObjectDetectionAPIDetectionOutputReplacement sub-graph replacement configuration file ' - 'must contain "coordinates_swap_method" in the "custom_attributes" dictionary. Two values are ' - 'supported: "swap_weights" and "add_convolution". The first one should be used when there is ' - 'a MatMul or Conv2D node before the "SecondStagePostprocessor" block in the topology. With this ' - 'solution the weights of the MatMul or Conv2D nodes are permutted, simulating the swap of XY ' - 'coordinates in the tensor. The second could be used in any other cases but it is worse in terms ' - 'of performance because it adds the Conv2D node which performs permutting of data. Since the ' - 'attribute is not defined the second approach is used by default.') - else: - coordinates_swap_method = custom_attributes['coordinates_swap_method'] - supported_swap_methods = ['swap_weights', 'add_convolution'] - if coordinates_swap_method not in supported_swap_methods: - raise Error('Unsupported "coordinates_swap_method" defined in the sub-graph replacement configuration ' - 'file. 
Supported methods are: {}'.format(', '.join(supported_swap_methods))) - - if coordinates_swap_method == 'add_convolution': - swapped_locs_node = add_convolution_to_swap_xy_coordinates(graph, eltwise_locs_node, 4) - reshape_loc_do_node = reshape_loc_do_op.create_node([swapped_locs_node], dict(name='do_reshape_locs')) - else: - reshape_loc_do_node = reshape_loc_do_op.create_node([eltwise_locs_node], dict(name='do_reshape_locs')) - - # find Proposal output which has the data layout as in TF: YXYX coordinates without batch indices. - proposal_nodes_ids = [node_id for node_id, attrs in graph.nodes(data=True) - if 'name' in attrs and attrs['name'] == 'crop_proposals'] - if len(proposal_nodes_ids) != 1: - raise Error("Found the following nodes '{}' with name 'crop_proposals' but there should be exactly 1. " - "Looks like ObjectDetectionAPIProposalReplacement replacement didn't work.". - format(proposal_nodes_ids)) - proposal_node = Node(graph, proposal_nodes_ids[0]) - - # check whether it is necessary to permute proposals coordinates before passing them to the DetectionOutput - # currently this parameter is set for the RFCN topologies - if 'swap_proposals' in custom_attributes and custom_attributes['swap_proposals']: - proposal_node = add_convolution_to_swap_xy_coordinates(graph, proposal_node, 4) - - # reshape priors boxes as Detection Output expects - reshape_priors_op = Reshape(graph, dict(dim=int64_array([-1, 1, max_proposals * 4]))) - reshape_priors_node = reshape_priors_op.create_node([proposal_node], - dict(name='DetectionOutput_reshape_priors_')) - - detection_output_op = DetectionOutput(graph, {}) - if coordinates_swap_method == 'swap_weights': - # update infer function to re-pack weights - detection_output_op.attrs['old_infer'] = detection_output_op.attrs['infer'] - detection_output_op.attrs['infer'] = __class__.do_infer - for key in ('clip_before_nms', 'clip_after_nms'): - if key in match.custom_replacement_desc.custom_attributes: - detection_output_op.attrs[key] = int(match.custom_replacement_desc.custom_attributes[key]) - - detection_output_node = detection_output_op.create_node( - [reshape_loc_do_node, reshape_conf_node, reshape_priors_node], - dict(name=detection_output_op.attrs['type'], share_location=0, variance_encoded_in_target=1, - code_type='caffe.PriorBoxParameter.CENTER_SIZE', pad_mode='caffe.ResizeParameter.CONSTANT', - resize_mode='caffe.ResizeParameter.WARP', - num_classes=num_classes, - confidence_threshold=_value_or_raise(match, pipeline_config, 'postprocessing_score_threshold'), - top_k=_value_or_raise(match, pipeline_config, 'postprocessing_max_detections_per_class'), - keep_top_k=_value_or_raise(match, pipeline_config, 'postprocessing_max_total_detections'), - nms_threshold=_value_or_raise(match, pipeline_config, 'postprocessing_iou_threshold'))) - # sets specific name to the node so we can find it in other replacers - detection_output_node.name = 'detection_output' - - output_op = Output(graph, dict(name='do_OutputOp')) - output_op.create_node([detection_output_node]) - - print('The graph output nodes "num_detections", "detection_boxes", "detection_classes", "detection_scores" ' - 'have been replaced with a single layer of type "Detection Output". 
Refer to IR catalogue in the ' - 'documentation for information about this layer.') - - return {'detection_output_node': detection_output_node} - - @staticmethod - def do_infer(node): - node.old_infer(node) - # compared to the IE's DetectionOutput, the TF keeps the locations in YXYX, need to get back to the XYXY - # for last matmul/Conv2D that operate the locations need to swap the X and Y for output feature weights & biases - swap_weights_xy(backward_bfs_for_operation(node.in_node(0), ['MatMul', 'Conv2D'])) -``` - -The differences in conversion are the following: - -* The locations tensor does not contain information about class 0 (background), but Inference Engine `DetectionOutput` layer expects it. Line 79 append dummy tensor with fake coordinates. -* The prior boxes tensor are not constant like in SSDs models, so it is not possible to apply the same solution. Instead, the element-wise multiplication is added to scale prior boxes tensor values with the variances values. The attribute `variance_encoded_in_target=1` is set to the `DetectionOutput` layer (lines 141-159). -* The X and Y coordinates in the tensor with bounding boxes locations adjustments should be swapped. For some topologies it could be done by updating preceding convolution weights, but if there is no preceding convolutional node, the Model Optimizer inserts convolution node with specific kernel and weights that performs coordinates swap during topology inference. -* Added marker node of type `OpOutput` that is used by the Model Optimizer to determine output nodes of the topology. It is used in the dead nodes elimination pass. - -#### Cutting Off Part of the Topology - -There is an ability to cut-off part of the topology using the `--output` command line parameter. Detailed information on why it could be useful is provided in the [Cutting Off Parts of a Model ](../Cutting_Model.md). The Faster R-CNN models are cut at the end using the sub-graph replacer `ObjectDetectionAPIOutputReplacement`. - -```python -class ObjectDetectionAPIOutputReplacement(FrontReplacementFromConfigFileGeneral): - """ - This replacer is used to cut-off the network by specified nodes for models generated with Object Detection API. - The custom attribute for the replacer contains one value for key "outputs". This string is a comma separated list - of outputs alternatives. Each output alternative is a '|' separated list of node name which could be outputs. The - first node from each alternative that exits in the graph is chosen. Others are ignored. - For example, if the "outputs" is equal to the following string: - - "Reshape_16,SecondStageBoxPredictor_1/Conv_3/BiasAdd|SecondStageBoxPredictor_1/Conv_1/BiasAdd" - - then the "Reshape_16" will be an output if it exists in the graph. The second output will be - SecondStageBoxPredictor_1/Conv_3/BiasAdd if it exist in the graph, if not then - SecondStageBoxPredictor_1/Conv_1/BiasAdd will be output if it exists in the graph. - """ - replacement_id = 'ObjectDetectionAPIOutputReplacement' - - def run_before(self): - return [ObjectDetectionAPIPreprocessorReplacement] - - def transform_graph(self, graph: Graph, replacement_descriptions: dict): - if graph.graph['cmd_params'].output is not None: - log.warning('User defined output nodes are specified. 
Skip the graph cut-off by the ' - 'ObjectDetectionAPIOutputReplacement.') - return - outputs = [] - outputs_string = replacement_descriptions['outputs'] - for alternatives in outputs_string.split(','): - for out_node_name in alternatives.split('|'): - if graph.has_node(out_node_name): - outputs.append(out_node_name) - break - else: - log.debug('A node "{}" does not exist in the graph. Do not add it as output'.format(out_node_name)) - _outputs = output_user_data_repack(graph, outputs) - add_output_ops(graph, _outputs, graph.graph['inputs']) -``` - -This is a replacer of type "general" which is called just once in comparison with other Front-replacers ("scope" and "points") which are called for each matched instance. The replacer reads node names that should become new output nodes, like specifying `--output `. The only difference is that the string containing node names could contain '|' character specifying output node names alternatives. Detailed explanation is provided in the class description in the code. - -The `detection_boxes`, `detection_scores`, `num_detections` nodes are specified as outputs in the `faster_rcnn_support.json` file. These nodes are used to remove part of the graph that is not be needed to calculate value of specified output nodes. - -### R-FCN topologies - -The R-FCN models are based on Faster R-CNN models so it is highly recommended to read the section about converting them first. Detailed information about R-FCN topologies is provided [in the abstract](https://arxiv.org/abs/1605.06409). - -#### Preprocessor Block - -R-FCN topologies contain similar `Preprocessor` block as SSD and Faster R-CNN topologies. The same `ObjectDetectionAPIPreprocessorReplacement` sub-graph replacer is used to cut it off. - -#### Proposal Layer - -Similar to Faster R-CNNs, R-FCN topologies contain implementation of Proposal layer before the `SecondStageBoxPredictor` block, so `ObjectDetectionAPIProposalReplacement` replacement is used in the sub-graph replacement configuration file. - -#### SecondStageBoxPredictor block - -The `SecondStageBoxPredictor` block differs from the self-titled block from Faster R-CNN topologies. It contains a number of `CropAndResize` operations consuming variously scaled boxes generated with a Proposal layer. The combination of `CropAndResize` layers located in the `while` loop forms a single position-sensitive ROI pooling (PSROIPooling) layer with bilinear interpolation. The `ObjectDetectionAPIPSROIPoolingReplacement` replacement matches two `while` loops with PSROIPooling layers applied to the blobs with box coordinates and classes predictions. 
- -```python -class ObjectDetectionAPIPSROIPoolingReplacement(FrontReplacementFromConfigFileSubGraph): - replacement_id = 'ObjectDetectionAPIPSROIPoolingReplacement' - - def run_after(self): - return [ObjectDetectionAPIProposalReplacement] - - def output_edges_match(self, graph: Graph, match: SubgraphMatch, new_sub_graph: dict): - return {match.output_node(0)[0].id: new_sub_graph['output_node'].id} - - def generate_sub_graph(self, graph: Graph, match: SubgraphMatch): - argv = graph.graph['cmd_params'] - if argv.tensorflow_object_detection_api_pipeline_config is None: - raise Error(missing_param_error) - pipeline_config = PipelineConfig(argv.tensorflow_object_detection_api_pipeline_config) - num_classes = _value_or_raise(match, pipeline_config, 'num_classes') - - input_node = match.input_nodes(0)[0][0].in_node(0) - if 'class_predictions' in input_node.id: - psroipooling_output_dim = num_classes + 1 - else: - psroipooling_output_dim = num_classes * 4 - - num_spatial_bins_height = pipeline_config.get_param('num_spatial_bins_height') - num_spatial_bins_width = pipeline_config.get_param('num_spatial_bins_width') - crop_height = pipeline_config.get_param('crop_height') - crop_width = pipeline_config.get_param('crop_width') - if crop_height != crop_width: - raise Error('Different "crop_height" and "crop_width" parameters from the pipeline config are not ' - 'supported: {} vs {}'.format(crop_height, crop_width)) - psroipooling_op = PSROIPoolingOp(graph, {'name': input_node.soft_get('name') + '/PSROIPooling', - 'output_dim': psroipooling_output_dim, - 'group_size': crop_width / num_spatial_bins_width, - 'spatial_bins_x': num_spatial_bins_width, - 'spatial_bins_y': num_spatial_bins_height, - 'mode': 'bilinear', - 'spatial_scale': 1, - }) - - if 'reshape_swap_proposals_2d' in graph.nodes(): - reshape_swap_proposals_node = Node(graph, 'reshape_swap_proposals_2d') - else: - swap_proposals_node = add_convolution_to_swap_xy_coordinates(graph, Node(graph, 'proposals'), 5) - reshape_swap_proposals_node = Reshape(graph, {'dim': [-1, 5], 'nchw_layout': True, - 'name': 'reshape_swap_proposals_2d'}).create_node( - [swap_proposals_node]) - psroipooling_node = psroipooling_op.create_node([input_node, reshape_swap_proposals_node]) - - reduce_op = Reduce(graph, {'name': 'mean', - 'reduce_type': 'mean', - 'axis': int64_array([1, 2]), - 'keep_dims': True - }) - reduce_node = reduce_op.create_node([psroipooling_node]) - - graph.erase_node(match.output_node(0)[0].out_node()) - - return {'output_node': reduce_node} -``` - -The main interest of the implementation of this replacer is the `generate_sub_graph` function. - -Lines 12-15: Parses the `pipeline.config` file and gets required parameters for the `PSROIPooling` layer. -Lines 17-21: Determines number of output channels for the `PSROIPooling` layer for box coordinates and classes predictions. -Lines 23-46: Create `PSROIPooling` layer based on model parameters determined from the pipeline configuration file. -Lines 48-53: Add Reduce layer which is the output of the `while` loops being replaced. - -#### SecondStagePostprocessor block - -The `SecondStagePostprocessor` block implements functionality of the `DetectionOutput` layer from the Inference Engine. The `ObjectDetectionAPIDetectionOutputReplacement` sub-graph replacement is used to replace the block. For this type of topologies the replacer adds convolution node to swap coordinates of boxes in of the 0-th input tensor to the `DetectionOutput` layer. 
The custom attribute `coordinates_swap_method` is set to value `add_convolution` in the sub-graph replacement configuration file to enable that behaviour. A method (`swap_weights`) is not suitable for this type of topologies because there are no `Mul` or `Conv2D` operations before the 0-th input of the `DetectionOutput` layer. - -#### Cutting Off Part of the Topology - -The R-FCN models are cut at the end with the sub-graph replacer `ObjectDetectionAPIOutputReplacement` as Faster R-CNNs topologies using the following output node names: `detection_boxes`. - -### Mask R-CNN Topologies - -The Mask R-CNN models are based on Faster R-CNN models so it is highly recommended to read the section about converting them first. Detailed information about Mask R-CNN topologies is provided [in the abstract](https://arxiv.org/abs/1703.06870). - -#### Preprocessor Block - -Mask R-CNN topologies contain similar `Preprocessor` block as SSD and Faster R-CNN topologies. The same `ObjectDetectionAPIPreprocessorReplacement` sub-graph replacer is used to cut it off. - -#### Proposal and ROI (Region of Interest) Pooling - -Proposal and ROI Pooling layers are added to Mask R-CNN topologies like in Faster R-CNNs. - -#### DetectionOutput Layer - -Unlike in SSDs and Faster R-CNNs, the implementation of the `DetectionOutput` layer in Mask R-CNNs topologies is not separated in a dedicated scope. But the matcher is defined with start/end points defined in the `mask_rcnn_support.json` so the replacer correctly adds the `DetectionOutput` layer. - -#### One More ROIPooling - -There is the second `CropAndResize` (equivalent of `ROIPooling` layer) that uses boxes produced with the `DetectionOutput` layer. The `ObjectDetectionAPIMaskRCNNROIPoolingSecondReplacement` replacer is used to replace this node. - -```python -class ObjectDetectionAPIMaskRCNNROIPoolingSecondReplacement(FrontReplacementFromConfigFileSubGraph): - replacement_id = 'ObjectDetectionAPIMaskRCNNROIPoolingSecondReplacement' - - def run_after(self): - return [ObjectDetectionAPIProposalReplacement] - - def output_edges_match(self, graph: Graph, match: SubgraphMatch, new_sub_graph: dict): - return {match.output_node(0)[0].id: new_sub_graph['roi_pooling_node'].id} - - def generate_sub_graph(self, graph: Graph, match: SubgraphMatch): - argv = graph.graph['cmd_params'] - if argv.tensorflow_object_detection_api_pipeline_config is None: - raise Error(missing_param_error) - pipeline_config = PipelineConfig(argv.tensorflow_object_detection_api_pipeline_config) - roi_pool_size = _value_or_raise(match, pipeline_config, 'initial_crop_size') - - detection_output_nodes_ids = [node_id for node_id, attrs in graph.nodes(data=True) - if 'name' in attrs and attrs['name'] == 'detection_output'] - if len(detection_output_nodes_ids) != 1: - raise Error("Found the following nodes '{}' with 'detection_output' but there should be exactly 1.". 
- format(detection_output_nodes_ids)) - detection_output_node = Node(graph, detection_output_nodes_ids[0]) - - # add reshape of Detection Output so it can be an output of the topology - reshape_detection_output_2d_op = Reshape(graph, dict(dim=int64_array([-1, 7]))) - reshape_detection_output_2d_node = reshape_detection_output_2d_op.create_node( - [detection_output_node], dict(name='reshape_do_2d')) - - # adds special node of type "Output" that is a marker for the output nodes of the topology - output_op = Output(graph, dict(name='do_reshaped_OutputOp')) - output_node = output_op.create_node([reshape_detection_output_2d_node]) - - # add attribute 'output_sort_order' so it will be used as a key to sort output nodes before generation of IR - output_node.in_edge()['data_attrs'].append('output_sort_order') - output_node.in_edge()['output_sort_order'] = [('detection_boxes', 0)] - - # creates two Crop operations which get input from the DetectionOutput layer, cuts of slices of data with class - # ids and probabilities and produce a tensor with batch ids and bounding boxes only (as it is expected by the - # ROIPooling layer) - crop_batch_op = Crop(graph, dict(axis=int64_array([3]), offset=int64_array([0]), dim=int64_array([1]), - nchw_layout=True)) - crop_batch_node = crop_batch_op.create_node([detection_output_node], dict(name='crop_do_batch_ids')) - - crop_coordinates_op = Crop(graph, dict(axis=int64_array([3]), offset=int64_array([3]), dim=int64_array([4]), - nchw_layout=True)) - crop_coordinates_node = crop_coordinates_op.create_node([detection_output_node], dict(name='crop_do_coords')) - - concat_op = Concat(graph, dict(axis=3)) - concat_node = concat_op.create_node([crop_batch_node, crop_coordinates_node], dict(name='batch_and_coords', - nchw_layout=True)) - - # reshape bounding boxes as required by ROIPooling - reshape_do_op = Reshape(graph, dict(dim=int64_array([-1, 5]))) - reshape_do_node = reshape_do_op.create_node([concat_node], dict(name='reshape_do')) - - roi_pooling_op = ROIPooling(graph, dict(method="bilinear", spatial_scale=1, - pooled_h=roi_pool_size, pooled_w=roi_pool_size)) - roi_pooling_node = roi_pooling_op.create_node([match.single_input_node(0)[0].in_node(), reshape_do_node], - dict(name='ROI_pooling_2')) - return {'roi_pooling_node': roi_pooling_node} -``` -The Inference Engine `DetectionOutput` layer implementation produces one tensor with seven numbers for each actual detection: - -* batch index -* class label -* class probability -* x_1 box coordinate -* y_1 box coordinate -* x_2 box coordinate -* y_2 box coordinate. - -The boxes coordinates must be fed to the `ROIPooling` layer, so the `Crop` layer is added to remove unnecessary part (lines 37-50). - -Then the result tensor is reshaped (lines 53-54) and `ROIPooling` layer is created (lines 56-59). - -#### Mask Tensors Processing - -The post-processing part of Mask R-CNN topologies filters out bounding boxes with low probabilities and applies activation function to the rest one. This post-processing is implemented using the `Gather` operation, which is not supported by the Inference Engine. Special Front-replacer removes this post-processing and just inserts the activation layer to the end. The filtering of bounding boxes is done in the dedicated demo `mask_rcnn_demo`. The code of the replacer is the following: - -```python -class ObjectDetectionAPIMaskRCNNSigmoidReplacement(FrontReplacementFromConfigFileGeneral): - """ - This replacer is used to convert Mask R-CNN topologies only. 
- Adds activation with sigmoid function to the end of the network producing masks tensors. - """ - replacement_id = 'ObjectDetectionAPIMaskRCNNSigmoidReplacement' - - def run_after(self): - return [ObjectDetectionAPIMaskRCNNROIPoolingSecondReplacement] - - def transform_graph(self, graph: Graph, replacement_descriptions): - output_node = None - op_outputs = [n for n, d in graph.nodes(data=True) if 'op' in d and d['op'] == 'OpOutput'] - for op_output in op_outputs: - last_node = Node(graph, op_output).in_node(0) - if last_node.name.startswith('SecondStageBoxPredictor'): - sigmoid_op = Activation(graph, dict(operation='sigmoid')) - sigmoid_node = sigmoid_op.create_node([last_node], dict(name=last_node.id + '/sigmoid')) - sigmoid_node.name = 'masks' - - if output_node is not None: - raise Error('Identified two possible outputs from the topology. Cannot proceed.') - # add special node of type "Output" that is a marker for the output nodes of the topology - output_op = Output(graph, dict(name=sigmoid_node.name + '/OutputOp')) - output_node = output_op.create_node([sigmoid_node]) - - print('The predicted masks are produced by the "masks" layer for each bounding box generated with a ' - '"detection_output" layer.\n Refer to IR catalogue in the documentation for information ' - 'about the DetectionOutput layer and Inference Engine documentation about output data interpretation.\n' - 'The topology can be inferred using dedicated demo "mask_rcnn_demo".') -``` -The replacer looks for the output node which name starts with 'SecondStageBoxPredictor' (the another node of type 'OpOutput' is located after the `DetectionOutput` node). This node contains the generated masks. The replacer adds activation layer 'Sigmoid' after this node as it is done in the initial TensorFlow* model. - -#### Cutting Off Part of the Topology - -The Mask R-CNN models are cut at the end with the sub-graph replacer `ObjectDetectionAPIOutputReplacement` using the following output node names: - -```SecondStageBoxPredictor_1/Conv_3/BiasAdd|SecondStageBoxPredictor_1/Conv_1/BiasAdd``` - -One of these two nodes produces output mask tensors. The child nodes of these nodes are related to post-processing which is implemented in the [Mask R-CNN demo](@ref omz_demos_mask_rcnn_demo_cpp) and should be cut off. +Implementation of the transformations for Object Detection API models is located in the file `/tools/model_optimizer/extensions/front/tf/ObjectDetectionAPI.py`. Refer to the code in this file to understand the details of the conversion process. diff --git a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_XLNet_From_Tensorflow.md b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_XLNet_From_Tensorflow.md index cc121ab19e1ad9..ac706c664f2d1e 100644 --- a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_XLNet_From_Tensorflow.md +++ b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_XLNet_From_Tensorflow.md @@ -24,13 +24,15 @@ To get pb-file from the archive contents, you need to do the following. 1. 
Run commands
```sh
- cd ~
- mkdir XLNet-Base
- cd XLNet-Base
- git clone https://github.com/zihangdai/xlnet
- wget https://storage.googleapis.com/xlnet/released_models/cased_L-12_H-768_A-12.zip
- unzip cased_L-12_H-768_A-12.zip
- mkdir try_save
+cd ~
+mkdir XLNet-Base
+cd XLNet-Base
+git clone https://github.com/zihangdai/xlnet
+wget https://storage.googleapis.com/xlnet/released_models/cased_L-12_H-768_A-12.zip
+unzip cased_L-12_H-768_A-12.zip
+mkdir try_save
+cd xlnet
+sed -i "s/tf\.train\.Optimizer/tf\.train.Optimizer if tf.__version__ < '1.15' else tf.compat.v1.train.Optimizer/g" model_utils.py
```
diff --git a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_YOLO_From_Tensorflow.md b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_YOLO_From_Tensorflow.md
index 60674b1c768ad8..40d592e4690d61 100644
--- a/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_YOLO_From_Tensorflow.md
+++ b/docs/MO_DG/prepare_model/convert_model/tf_specific/Convert_YOLO_From_Tensorflow.md
@@ -67,7 +67,11 @@ git checkout ed60b90
```
3. Download [coco.names](https://raw.githubusercontent.com/pjreddie/darknet/master/data/coco.names) file from the DarkNet website **OR** use labels that fit your task.
4. Download the [yolov3.weights](https://pjreddie.com/media/files/yolov3.weights) (for the YOLOv3 model) or [yolov3-tiny.weights](https://pjreddie.com/media/files/yolov3-tiny.weights) (for the YOLOv3-tiny model) file **OR** use your pre-trained weights with the same structure
-5. Run a converter:
+5. Install Pillow (the maintained fork of PIL), which is used by the conversion script in the repo:
+```sh
+pip install pillow
+```
+6. Run a converter:
- for YOLO-v3:
```sh
python3 convert_weights_pb.py --class_names coco.names --data_format NHWC --weights_file yolov3.weights
@@ -88,7 +92,7 @@ python3 convert_weights_pb.py --class_names coco.names --data_format NHWC --weig
### Convert YOLOv3 TensorFlow Model to IR
-To solve the problems explained in the YOLOv3 architecture overview section, use the `yolo_v3.json` or `yolo_v3_tiny.json` (depending on a model) configuration file with custom operations located in the `/deployment_tools/model_optimizer/extensions/front/tf` repository.
+To solve the problems explained in the YOLOv3 architecture overview section, use the `yolo_v3.json` or `yolo_v3_tiny.json` (depending on a model) configuration file with custom operations located in the `/tools/model_optimizer/extensions/front/tf` repository.
It consists of several attributes:
```sh @@ -202,7 +206,7 @@ Converted TensorFlow YOLO model is missing `Region` layer and its parameters. Or file under the `[region]` title. To recreate the original model structure, use the corresponding yolo `.json` configuration file with custom operations and `Region` layer -parameters when converting the model to the IR. This file is located in the `/deployment_tools/model_optimizer/extensions/front/tf` directory. +parameters when converting the model to the IR. This file is located in the `/tools/model_optimizer/extensions/front/tf` directory. If chosen model has specific values of this parameters, create another configuration file with custom operations and use it for conversion. @@ -213,7 +217,7 @@ python3 ./mo_tf.py --input_model /.pb \ --batch 1 \ --scale 255 \ ---transformations_config /deployment_tools/model_optimizer/extensions/front/tf/.json +--transformations_config /tools/model_optimizer/extensions/front/tf/.json ``` where: diff --git a/docs/MO_DG/prepare_model/customize_model_optimizer/Customize_Model_Optimizer.md b/docs/MO_DG/prepare_model/customize_model_optimizer/Customize_Model_Optimizer.md index cda8458e4dd72f..567543a01a88dd 100644 --- a/docs/MO_DG/prepare_model/customize_model_optimizer/Customize_Model_Optimizer.md +++ b/docs/MO_DG/prepare_model/customize_model_optimizer/Customize_Model_Optimizer.md @@ -34,7 +34,7 @@ Model Optimizer extensibility mechanism enables support of new operations and custom transformations to generate the optimized intermediate representation (IR) as described in the [Deep Learning Network Intermediate Representation and Operation Sets in OpenVINO™](../../IR_and_opsets.md). This -mechanism is a core part of the Model Optimizer. The Model Optimizer itself uses it under the hood, being a huge set of examples on how to add custom logic to support your model. +mechanism is a core part of the Model Optimizer, which uses it under the hood, so the Model Optimizer itself is a huge set of examples for adding custom logic to support your model. There are several cases when the customization is needed: diff --git a/docs/MO_DG/prepare_model/customize_model_optimizer/Extending_Model_Optimizer_with_Caffe_Python_Layers.md b/docs/MO_DG/prepare_model/customize_model_optimizer/Extending_Model_Optimizer_with_Caffe_Python_Layers.md index e4a71a8fdc9298..579437aeb5a98a 100644 --- a/docs/MO_DG/prepare_model/customize_model_optimizer/Extending_Model_Optimizer_with_Caffe_Python_Layers.md +++ b/docs/MO_DG/prepare_model/customize_model_optimizer/Extending_Model_Optimizer_with_Caffe_Python_Layers.md @@ -35,7 +35,7 @@ operation. Here is a simplified example of the extractor for the custom operation Proposal from Faster-R-CNN model mentioned above. The full code with additional checks is provided in the -`/deployment_tools/model_optimizer/extensions/front/caffe/proposal_python_ext.py`. The sample code uses +`/tools/model_optimizer/extensions/front/caffe/proposal_python_ext.py`. The sample code uses operation `ProposalOp` which corresponds to `Proposal` operation described in the [Available Operations Sets](../../../ops/opset.md) document. Refer to the source code below for a detailed explanation of the extractor. 
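Since the hunk above only references the extractor file, here is a minimal, hedged sketch (in Python) of the pattern such a Caffe Python layer extractor follows. The base class location, the `parse_param_str` helper, and the default attribute values are assumptions for illustration only; the authoritative code is in `proposal_python_ext.py`.

```python
# Hedged sketch, not the actual contents of proposal_python_ext.py.
from extensions.ops.proposal import ProposalOp               # operation mentioned in the text above
from mo.front.extractor import CaffePythonFrontExtractorOp   # assumed location of the base class


class ProposalPythonFrontExtractor(CaffePythonFrontExtractorOp):
    # Must match the "module.class" string of the Python layer in the Caffe prototxt
    op = 'rpn.proposal_layer.ProposalLayer'
    enabled = True

    @classmethod
    def extract(cls, node):
        # The Python layer keeps its parameters in 'param_str'; start from
        # illustrative defaults and override them with the parsed values.
        attrs = {
            'feat_stride': 16,
            'pre_nms_topn': 6000,
            'post_nms_topn': 300,
            'nms_thresh': 0.7,
        }
        attrs.update(cls.parse_param_str(node.pb.python_param.param_str))  # assumed base-class helper
        # Attach the attributes so the node is handled as a regular Proposal operation downstream.
        ProposalOp.update_node_stat(node, attrs)
        return cls.enabled
```

With an extractor like this placed next to the other Caffe front extensions (or supplied through the Model Optimizer `--extensions` option), the Python `Proposal` layer is recognized during conversion instead of being reported as an unsupported operation.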
diff --git a/docs/benchmarks/performance_benchmarks_faq.md b/docs/benchmarks/performance_benchmarks_faq.md index 2ff33612097b38..b833f03c531862 100644 --- a/docs/benchmarks/performance_benchmarks_faq.md +++ b/docs/benchmarks/performance_benchmarks_faq.md @@ -19,31 +19,34 @@ All of the performance benchmarks were generated using the open-sourced tool wit #### 6. What image sizes are used for the classification network models? The image size used in the inference depends on the network being benchmarked. The following table shows the list of input sizes for each network model. -| **Model** | **Public Network** | **Task** | **Input Size** (Height x Width) | -|------------------------------------------------------------------------------------------------------------------------------------|-----------------------------------------|-----------------------------|-----------------------------------| -| [bert-large-uncased-whole-word-masking-squad](https://github.com/openvinotoolkit/open_model_zoo/tree/develop/models/intel/bert-large-uncased-whole-word-masking-squad-int8-0001) | BERT-large |question / answer |384| -| [deeplabv3-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/deeplabv3) | DeepLab v3 Tf |semantic segmentation | 513x513 | -| [densenet-121-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/densenet-121-tf) | Densenet-121 Tf |classification | 224x224 | -| [facenet-20180408-102900-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/facenet-20180408-102900) | FaceNet TF | face recognition | 160x160 | -| [faster_rcnn_resnet50_coco-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/faster_rcnn_resnet50_coco) | Faster RCNN Tf | object detection | 600x1024 | -| [googlenet-v1-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/googlenet-v1-tf) | GoogLeNet_ILSVRC-2012 | classification | 224x224 | -| [inception-v3-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/googlenet-v3) | Inception v3 Tf | classification | 299x299 | -| [mobilenet-ssd-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/mobilenet-ssd) | SSD (MobileNet)_COCO-2017_Caffe | object detection | 300x300 | -| [mobilenet-v1-1.0-224-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/mobilenet-v1-1.0-224-tf) | MobileNet v1 Tf | classification | 224x224 | -| [mobilenet-v2-1.0-224-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/mobilenet-v2-1.0-224) | MobileNet v2 Tf | classification | 224x224 | -| [mobilenet-v2-pytorch](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/mobilenet-v2-pytorch ) | Mobilenet V2 PyTorch | classification | 224x224 | -| [resnet-18-pytorch](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-18-pytorch) | ResNet-18 PyTorch | classification | 224x224 | -| [resnet-50-pytorch](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-50-pytorch) | ResNet-50 v1 PyTorch | classification | 224x224 | -| [resnet-50-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-50-tf) | ResNet-50_v1_ILSVRC-2012 | classification | 224x224 | -| [se-resnext-50-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/se-resnext-50) | Se-ResNext-50_ILSVRC-2012_Caffe | classification | 224x224 | -| 
[squeezenet1.1-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/squeezenet1.1) | SqueezeNet_v1.1_ILSVRC-2012_Caffe | classification | 227x227 | -| [ssd300-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/ssd300) | SSD (VGG-16)_VOC-2007_Caffe | object detection | 300x300 | -| [yolo_v3-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/yolo-v3-tf) | TF Keras YOLO v3 Modelset | object detection | 300x300 | -| [yolo_v4-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/yolo-v4-tf) | Yolo-V4 TF | object detection | 608x608 | -| [ssd_mobilenet_v1_coco-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/ssd_mobilenet_v1_coco) | ssd_mobilenet_v1_coco | object detection | 300x300 | -| [ssdlite_mobilenet_v2-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/ssdlite_mobilenet_v2) | ssd_mobilenet_v2 | object detection | 300x300 | -| [unet-camvid-onnx-0001](https://github.com/openvinotoolkit/open_model_zoo/blob/master/models/intel/unet-camvid-onnx-0001/description/unet-camvid-onnx-0001.md) | U-Net | semantic segmentation | 368x480 | - +| **Model** | **Public Network** | **Task** | **Input Size** (Height x Width) | +|------------------------------------------------------------------------------------------------------------------------------------|------------------------------------|-----------------------------|-----------------------------------| +| [bert-large-uncased-whole-word-masking-squad](https://github.com/openvinotoolkit/open_model_zoo/tree/develop/models/intel/bert-large-uncased-whole-word-masking-squad-int8-0001) | BERT-large |question / answer |384| +| [brain-tumor-segmentation-0001-MXNET](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/brain-tumor-segmentation-0001) | brain-tumor-segmentation-0001 | semantic segmentation | 128x128x128 | +| [brain-tumor-segmentation-0002-CF2](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/brain-tumor-segmentation-0002) | brain-tumor-segmentation-0002 | semantic segmentation | 128x128x128 | +| [deeplabv3-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/deeplabv3) | DeepLab v3 Tf | semantic segmentation | 513x513 | +| [densenet-121-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/densenet-121-tf) | Densenet-121 Tf | classification | 224x224 | +| [facenet-20180408-102900-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/facenet-20180408-102900) | FaceNet TF | face recognition | 160x160 | +| [faster_rcnn_resnet50_coco-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/faster_rcnn_resnet50_coco) | Faster RCNN Tf | object detection | 600x1024 | +| [inception-v4-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/develop/models/public/googlenet-v4-tf) | Inception v4 Tf (aka GoogleNet-V4) | classification | 299x299 | +| [inception-v3-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/googlenet-v3) | Inception v3 Tf | classification | 299x299 | +| [mobilenet-ssd-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/mobilenet-ssd) | SSD (MobileNet)_COCO-2017_Caffe | object detection | 300x300 | +| [mobilenet-v2-1.0-224-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/mobilenet-v2-1.0-224) | MobileNet v2 Tf | classification | 
224x224 | +| [mobilenet-v2-pytorch](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/mobilenet-v2-pytorch ) | Mobilenet V2 PyTorch | classification | 224x224 | +| [resnet-18-pytorch](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-18-pytorch) | ResNet-18 PyTorch | classification | 224x224 | +| [resnet-50-pytorch](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-50-pytorch) | ResNet-50 v1 PyTorch | classification | 224x224 | +| [resnet-50-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/resnet-50-tf) | ResNet-50_v1_ILSVRC-2012 | classification | 224x224 | +| [se-resnext-50-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/se-resnext-50) | Se-ResNext-50_ILSVRC-2012_Caffe | classification | 224x224 | +| [squeezenet1.1-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/squeezenet1.1) | SqueezeNet_v1.1_ILSVRC-2012_Caffe | classification | 227x227 | +| [ssd300-CF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/ssd300) | SSD (VGG-16)_VOC-2007_Caffe | object detection | 300x300 | +| [yolo_v4-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/yolo-v4-tf) | Yolo-V4 TF | object detection | 608x608 | +| [ssd_mobilenet_v1_coco-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/ssd_mobilenet_v1_coco) | ssd_mobilenet_v1_coco | object detection | 300x300 | +| [ssdlite_mobilenet_v2-TF](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/ssdlite_mobilenet_v2) | ssdlite_mobilenet_v2 | object detection | 300x300 | +| [unet-camvid-onnx-0001](https://github.com/openvinotoolkit/open_model_zoo/blob/master/models/intel/unet-camvid-onnx-0001/description/unet-camvid-onnx-0001.md) | U-Net | semantic segmentation | 368x480 | +| [yolo-v3-tiny-tf](https://github.com/openvinotoolkit/open_model_zoo/tree/develop/models/public/yolo-v3-tiny-tf) | YOLO v3 Tiny | object detection | 416x416 | +| [ssd-resnet34-1200-onnx](https://github.com/openvinotoolkit/open_model_zoo/tree/develop/models/public/ssd-resnet34-1200-onnx) | ssd-resnet34 onnx model | object detection | 1200x1200 | +| [vgg19-caffe](https://github.com/openvinotoolkit/open_model_zoo/tree/master/models/public/vgg19-caffe2) | VGG-19 | classification | 224x224| + #### 7. Where can I purchase the specific hardware used in the benchmarking? Intel partners with various vendors all over the world. Visit the [Intel® AI: In Production Partners & Solutions Catalog](https://www.intel.com/content/www/us/en/internet-of-things/ai-in-production/partners-solutions-catalog.html) for a list of Equipment Makers and the [Supported Devices](../IE_DG/supported_plugins/Supported_Devices.md) documentation. You can also remotely test and run models before purchasing any hardware by using [Intel® DevCloud for the Edge](http://devcloud.intel.com/edge/). 
diff --git a/docs/benchmarks/performance_benchmarks_openvino.md b/docs/benchmarks/performance_benchmarks_openvino.md index 456f593db14461..be7c46410d752f 100644 --- a/docs/benchmarks/performance_benchmarks_openvino.md +++ b/docs/benchmarks/performance_benchmarks_openvino.md @@ -29,81 +29,86 @@ Measuring inference performance involves many variables and is extremely use-cas \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly - \htmlonly - + \endhtmlonly + \htmlonly - + \endhtmlonly +\htmlonly + +\endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly \htmlonly - + \endhtmlonly + + ## Platform Configurations -Intel® Distribution of OpenVINO™ toolkit performance benchmark numbers are based on release 2021.3. +Intel® Distribution of OpenVINO™ toolkit performance benchmark numbers are based on release 2021.4. -Intel technologies’ features and benefits depend on system configuration and may require enabled hardware, software or service activation. Learn more at intel.com, or from the OEM or retailer. Performance results are based on testing as of March 15, 2021 and may not reflect all publicly available updates. See configuration disclosure for details. No product can be absolutely secure. +Intel technologies’ features and benefits depend on system configuration and may require enabled hardware, software or service activation. Learn more at intel.com, or from the OEM or retailer. Performance results are based on testing as of June 18, 2021 and may not reflect all publicly available updates. See configuration disclosure for details. No product can be absolutely secure. Performance varies by use, configuration and other factors. Learn more at [www.intel.com/PerformanceIndex](https://www.intel.com/PerformanceIndex). @@ -127,15 +132,15 @@ Testing by Intel done on: see test date for each HW platform below. | Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | | Kernel Version | 5.3.0-24-generic | 5.3.0-24-generic | 5.3.0-24-generic | | BIOS Vendor | American Megatrends Inc.* | American Megatrends Inc. | Intel Corporation | -| BIOS Version | 0904 | 607 | SE5C620.86B.02.01.
0009.092820190230 | -| BIOS Release | April 12, 2019 | May 29, 2020 | September 28, 2019 | +| BIOS Version | 0904 | 607 | SE5C620.86B.02.01.
0013.121520200651 | +| BIOS Release | April 12, 2019 | May 29, 2020 | December 15, 2020 | | BIOS Settings | Select optimized default settings,
save & exit | Select optimized default settings,
save & exit | Select optimized default settings,
change power policy
to "performance",
save & exit | | Batch size | 1 | 1 | 1 | Precision | INT8 | INT8 | INT8 | Number of concurrent inference requests | 4 | 5 | 32 -| Test Date | March 15, 2021 | March 15, 2021 | March 15, 2021 -| Power dissipation, TDP in Watt | [71](https://ark.intel.com/content/www/us/en/ark/products/134854/intel-xeon-e-2124g-processor-8m-cache-up-to-4-50-ghz.html#tab-blade-1-0-1) | [125](https://ark.intel.com/content/www/us/en/ark/products/199336/intel-xeon-w-1290p-processor-20m-cache-3-70-ghz.html) | [125](https://ark.intel.com/content/www/us/en/ark/products/193394/intel-xeon-silver-4216-processor-22m-cache-2-10-ghz.html#tab-blade-1-0-1) | -| CPU Price on Mach 15th, 2021, USD
Prices may vary | [213](https://ark.intel.com/content/www/us/en/ark/products/134854/intel-xeon-e-2124g-processor-8m-cache-up-to-4-50-ghz.html) | [539](https://ark.intel.com/content/www/us/en/ark/products/199336/intel-xeon-w-1290p-processor-20m-cache-3-70-ghz.html) |[1,002](https://ark.intel.com/content/www/us/en/ark/products/193394/intel-xeon-silver-4216-processor-22m-cache-2-10-ghz.html) | +| Test Date | June 18, 2021 | June 18, 2021 | June 18, 2021 +| Rated maximum TDP/socket in Watt | [71](https://ark.intel.com/content/www/us/en/ark/products/134854/intel-xeon-e-2124g-processor-8m-cache-up-to-4-50-ghz.html#tab-blade-1-0-1) | [125](https://ark.intel.com/content/www/us/en/ark/products/199336/intel-xeon-w-1290p-processor-20m-cache-3-70-ghz.html) | [125](https://ark.intel.com/content/www/us/en/ark/products/193394/intel-xeon-silver-4216-processor-22m-cache-2-10-ghz.html#tab-blade-1-0-1) | +| CPU Price/socket on June 21, 2021, USD
Prices may vary | [213](https://ark.intel.com/content/www/us/en/ark/products/134854/intel-xeon-e-2124g-processor-8m-cache-up-to-4-50-ghz.html) | [539](https://ark.intel.com/content/www/us/en/ark/products/199336/intel-xeon-w-1290p-processor-20m-cache-3-70-ghz.html) |[1,002](https://ark.intel.com/content/www/us/en/ark/products/193394/intel-xeon-silver-4216-processor-22m-cache-2-10-ghz.html) | **CPU Inference Engines (continue)** @@ -149,84 +154,104 @@ Testing by Intel done on: see test date for each HW platform below. | Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | | Kernel Version | 5.3.0-24-generic | 5.3.0-24-generic | 5.3.0-24-generic | | BIOS Vendor | Intel Corporation | Intel Corporation | Intel Corporation | -| BIOS Version | SE5C620.86B.02.01.
0009.092820190230 | SE5C620.86B.02.01.
0009.092820190230 | WLYDCRB1.SYS.0020.
P86.2103050636 | -| BIOS Release | September 28, 2019 | September 28, 2019 | March 5, 2021 | +| BIOS Version | SE5C620.86B.02.01.
0013.121520200651 | SE5C620.86B.02.01.
0013.121520200651 | WLYDCRB1.SYS.0020.
P86.2103050636 | +| BIOS Release | December 15, 2020 | December 15, 2020 | March 5, 2021 | | BIOS Settings | Select optimized default settings,
change power policy to "performance",
save & exit | Select optimized default settings,
change power policy to "performance",
save & exit | Select optimized default settings,
change power policy to "performance",
save & exit | | Batch size | 1 | 1 | 1 | | Precision | INT8 | INT8 | INT8 | | Number of concurrent inference requests |32 | 52 | 80 | -| Test Date | March 15, 2021 | March 15, 2021 | March 22, 2021 | -| Power dissipation, TDP in Watt | [105](https://ark.intel.com/content/www/us/en/ark/products/193953/intel-xeon-gold-5218t-processor-22m-cache-2-10-ghz.html#tab-blade-1-0-1) | [205](https://ark.intel.com/content/www/us/en/ark/products/192482/intel-xeon-platinum-8270-processor-35-75m-cache-2-70-ghz.html#tab-blade-1-0-1) | [270](https://ark.intel.com/content/www/us/en/ark/products/212287/intel-xeon-platinum-8380-processor-60m-cache-2-30-ghz.html) | -| CPU Price, USD
Prices may vary | [1,349](https://ark.intel.com/content/www/us/en/ark/products/193953/intel-xeon-gold-5218t-processor-22m-cache-2-10-ghz.html) (on Mach 15th, 2021) | [7,405](https://ark.intel.com/content/www/us/en/ark/products/192482/intel-xeon-platinum-8270-processor-35-75m-cache-2-70-ghz.html) (on Mach 15th, 2021) | [8,099](https://ark.intel.com/content/www/us/en/ark/products/212287/intel-xeon-platinum-8380-processor-60m-cache-2-30-ghz.html) (on March 26th, 2021) | +| Test Date | June 18, 2021 | June 18, 2021 | June 18, 2021 | +| Rated maximum TDP/socket in Watt | [105](https://ark.intel.com/content/www/us/en/ark/products/193953/intel-xeon-gold-5218t-processor-22m-cache-2-10-ghz.html#tab-blade-1-0-1) | [205](https://ark.intel.com/content/www/us/en/ark/products/192482/intel-xeon-platinum-8270-processor-35-75m-cache-2-70-ghz.html#tab-blade-1-0-1) | [270](https://ark.intel.com/content/www/us/en/ark/products/212287/intel-xeon-platinum-8380-processor-60m-cache-2-30-ghz.html) | +| CPU Price/socket on June 21, 2021, USD
Prices may vary | [1,349](https://ark.intel.com/content/www/us/en/ark/products/193953/intel-xeon-gold-5218t-processor-22m-cache-2-10-ghz.html) | [7,405](https://ark.intel.com/content/www/us/en/ark/products/192482/intel-xeon-platinum-8270-processor-35-75m-cache-2-70-ghz.html) | [8,099](https://ark.intel.com/content/www/us/en/ark/products/212287/intel-xeon-platinum-8380-processor-60m-cache-2-30-ghz.html) | **CPU Inference Engines (continue)** -| | Intel® Core™ i7-8700T | Intel® Core™ i9-10920X | 11th Gen Intel® Core™ i7-1185G7 | -| -------------------- | ----------------------------------- |--------------------------------------| --------------------------------| -| Motherboard | GIGABYTE* Z370M DS3H-CF | ASUS* PRIME X299-A II | Intel Corporation
internal/Reference
Validation Platform | -| CPU | Intel® Core™ i7-8700T CPU @ 2.40GHz | Intel® Core™ i9-10920X CPU @ 3.50GHz | 11th Gen Intel® Core™ i7-1185G7 @ 3.00GHz | -| Hyper Threading | ON | ON | ON | -| Turbo Setting | ON | ON | ON | -| Memory | 4 x 16 GB DDR4 2400MHz | 4 x 16 GB DDR4 2666MHz | 2 x 8 GB DDR4 3200MHz | -| Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | -| Kernel Version | 5.3.0-24-generic | 5.3.0-24-generic | 5.8.0-05-generic | -| BIOS Vendor | American Megatrends Inc.* | American Megatrends Inc.* | Intel Corporation | -| BIOS Version | F11 | 505 | TGLSFWI1.R00.3425.
A00.2010162309 | -| BIOS Release | March 13, 2019 | December 17, 2019 | October 16, 2020 | -| BIOS Settings | Select optimized default settings,
set OS type to "other",
save & exit | Default Settings | Default Settings | -| Batch size | 1 | 1 | 1 | -| Precision | INT8 | INT8 | INT8 | -| Number of concurrent inference requests |4 | 24 | 4 | -| Test Date | March 15, 2021 | March 15, 2021 | March 15, 2021 | -| Power dissipation, TDP in Watt | [35](https://ark.intel.com/content/www/us/en/ark/products/129948/intel-core-i7-8700t-processor-12m-cache-up-to-4-00-ghz.html#tab-blade-1-0-1) | [165](https://ark.intel.com/content/www/us/en/ark/products/198012/intel-core-i9-10920x-x-series-processor-19-25m-cache-3-50-ghz.html) | [28](https://ark.intel.com/content/www/us/en/ark/products/208664/intel-core-i7-1185g7-processor-12m-cache-up-to-4-80-ghz-with-ipu.html#tab-blade-1-0-1) | -| CPU Price on Mach 15th, 2021, USD
Prices may vary | [303](https://ark.intel.com/content/www/us/en/ark/products/129948/intel-core-i7-8700t-processor-12m-cache-up-to-4-00-ghz.html) | [700](https://ark.intel.com/content/www/us/en/ark/products/198012/intel-core-i9-10920x-x-series-processor-19-25m-cache-3-50-ghz.html) | [426](https://ark.intel.com/content/www/us/en/ark/products/208664/intel-core-i7-1185g7-processor-12m-cache-up-to-4-80-ghz-with-ipu.html#tab-blade-1-0-0) | +| | Intel® Core™ i7-8700T | Intel® Core™ i9-10920X | +| -------------------- | ----------------------------------- |--------------------------------------| +| Motherboard | GIGABYTE* Z370M DS3H-CF | ASUS* PRIME X299-A II | +| CPU | Intel® Core™ i7-8700T CPU @ 2.40GHz | Intel® Core™ i9-10920X CPU @ 3.50GHz | +| Hyper Threading | ON | ON | +| Turbo Setting | ON | ON | +| Memory | 4 x 16 GB DDR4 2400MHz | 4 x 16 GB DDR4 2666MHz | +| Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | +| Kernel Version | 5.3.0-24-generic | 5.3.0-24-generic | +| BIOS Vendor | American Megatrends Inc.* | American Megatrends Inc.* | +| BIOS Version | F14c | 1004 | +| BIOS Release | March 23, 2021 | March 19, 2021 | +| BIOS Settings | Select optimized default settings,
set OS type to "other",
save & exit | Default Settings | +| Batch size | 1 | 1 | +| Precision | INT8 | INT8 | +| Number of concurrent inference requests |4 | 24 | +| Test Date | June 18, 2021 | June 18, 2021 | +| Rated maximum TDP/socket in Watt | [35](https://ark.intel.com/content/www/us/en/ark/products/129948/intel-core-i7-8700t-processor-12m-cache-up-to-4-00-ghz.html#tab-blade-1-0-1) | [165](https://ark.intel.com/content/www/us/en/ark/products/198012/intel-core-i9-10920x-x-series-processor-19-25m-cache-3-50-ghz.html) | +| CPU Price/socket on June 21, 2021, USD
Prices may vary | [303](https://ark.intel.com/content/www/us/en/ark/products/129948/intel-core-i7-8700t-processor-12m-cache-up-to-4-00-ghz.html) | [700](https://ark.intel.com/content/www/us/en/ark/products/198012/intel-core-i9-10920x-x-series-processor-19-25m-cache-3-50-ghz.html) | +**CPU Inference Engines (continue)** +| | 11th Gen Intel® Core™ i7-1185G7 | 11th Gen Intel® Core™ i7-11850HE | +| -------------------- | --------------------------------|----------------------------------| +| Motherboard | Intel Corporation
internal/Reference
Validation Platform | Intel Corporation
internal/Reference
Validation Platform | +| CPU | 11th Gen Intel® Core™ i7-1185G7 @ 3.00GHz | 11th Gen Intel® Core™ i7-11850HE @ 2.60GHz | +| Hyper Threading | ON | ON | +| Turbo Setting | ON | ON | +| Memory | 2 x 8 GB DDR4 3200MHz | 2 x 16 GB DDR4 3200MHz | +| Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04.4 LTS | +| Kernel Version | 5.8.0-05-generic | 5.8.0-050800-generic | +| BIOS Vendor | Intel Corporation | Intel Corporation | +| BIOS Version | TGLSFWI1.R00.3425.
A00.2010162309 | TGLIFUI1.R00.4064.
A01.2102200132 | +| BIOS Release | October 16, 2020 | February 20, 2021 | +| BIOS Settings | Default Settings | Default Settings | +| Batch size | 1 | 1 | +| Precision | INT8 | INT8 | +| Number of concurrent inference requests |4 | 4 | +| Test Date | June 18, 2021 | June 18, 2021 | +| Rated maximum TDP/socket in Watt | [28](https://ark.intel.com/content/www/us/en/ark/products/208664/intel-core-i7-1185g7-processor-12m-cache-up-to-4-80-ghz-with-ipu.html) | [45](https://ark.intel.com/content/www/us/en/ark/products/213799/intel-core-i7-11850h-processor-24m-cache-up-to-4-80-ghz.html) | +| CPU Price/socket on June 21, 2021, USD
Prices may vary | [426](https://ark.intel.com/content/www/us/en/ark/products/208664/intel-core-i7-1185g7-processor-12m-cache-up-to-4-80-ghz-with-ipu.html) | [395](https://ark.intel.com/content/www/us/en/ark/products/213799/intel-core-i7-11850h-processor-24m-cache-up-to-4-80-ghz.html) | **CPU Inference Engines (continue)** -| | Intel® Core™ i5-8500 | Intel® Core™ i5-10500TE | -| -------------------- | ---------------------------------- | ----------------------------------- | -| Motherboard | ASUS* PRIME Z370-A | GIGABYTE* Z490 AORUS PRO AX | -| CPU | Intel® Core™ i5-8500 CPU @ 3.00GHz | Intel® Core™ i5-10500TE CPU @ 2.30GHz | -| Hyper Threading | OFF | ON | -| Turbo Setting | ON | ON | -| Memory | 2 x 16 GB DDR4 2666MHz | 2 x 16 GB DDR4 @ 2666MHz | -| Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | -| Kernel Version | 5.3.0-24-generic | 5.3.0-24-generic | -| BIOS Vendor | American Megatrends Inc.* | American Megatrends Inc.* | -| BIOS Version | 2401 | F3 | -| BIOS Release | July 12, 2019 | March 25, 2020 | -| BIOS Settings | Select optimized default settings,
save & exit | Select optimized default settings,
set OS type to "other",
save & exit | -| Batch size | 1 | 1 | -| Precision | INT8 | INT8 | -| Number of concurrent inference requests | 3 | 4 | -| Test Date | March 15, 2021 | March 15, 2021 | -| Power dissipation, TDP in Watt | [65](https://ark.intel.com/content/www/us/en/ark/products/129939/intel-core-i5-8500-processor-9m-cache-up-to-4-10-ghz.html#tab-blade-1-0-1)| [35](https://ark.intel.com/content/www/us/en/ark/products/203891/intel-core-i5-10500te-processor-12m-cache-up-to-3-70-ghz.html) | -| CPU Price on Mach 15th, 2021, USD
Prices may vary | [192](https://ark.intel.com/content/www/us/en/ark/products/129939/intel-core-i5-8500-processor-9m-cache-up-to-4-10-ghz.html) | [195](https://ark.intel.com/content/www/us/en/ark/products/203891/intel-core-i5-10500te-processor-12m-cache-up-to-3-70-ghz.html) | +| | Intel® Core™ i3-8100 | Intel® Core™ i5-8500 | Intel® Core™ i5-10500TE | +| -------------------- |----------------------------------- | ---------------------------------- | ----------------------------------- | +| Motherboard | GIGABYTE* Z390 UD | ASUS* PRIME Z370-A | GIGABYTE* Z490 AORUS PRO AX | +| CPU | Intel® Core™ i3-8100 CPU @ 3.60GHz | Intel® Core™ i5-8500 CPU @ 3.00GHz | Intel® Core™ i5-10500TE CPU @ 2.30GHz | +| Hyper Threading | OFF | OFF | ON | +| Turbo Setting | OFF | ON | ON | +| Memory | 4 x 8 GB DDR4 2400MHz | 2 x 16 GB DDR4 2666MHz | 2 x 16 GB DDR4 @ 2666MHz | +| Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | +| Kernel Version | 5.3.0-24-generic | 5.3.0-24-generic | 5.3.0-24-generic | +| BIOS Vendor | American Megatrends Inc.* | American Megatrends Inc.* | American Megatrends Inc.* | +| BIOS Version | F8 | 2401 | F3 | +| BIOS Release | May 24, 2019 | July 12, 2019 | March 25, 2020 | +| BIOS Settings | Select optimized default settings,
set OS type to "other",
save & exit | Select optimized default settings,
save & exit | Select optimized default settings,
set OS type to "other",
save & exit | +| Batch size | 1 | 1 | 1 | +| Precision | INT8 | INT8 | INT8 | +| Number of concurrent inference requests | 4 | 3 | 4 | +| Test Date | June 18, 2021 | June 18, 2021 | June 18, 2021 | +| Rated maximum TDP/socket in Watt | [65](https://ark.intel.com/content/www/us/en/ark/products/126688/intel-core-i3-8100-processor-6m-cache-3-60-ghz.html#tab-blade-1-0-1)| [65](https://ark.intel.com/content/www/us/en/ark/products/129939/intel-core-i5-8500-processor-9m-cache-up-to-4-10-ghz.html#tab-blade-1-0-1)| [35](https://ark.intel.com/content/www/us/en/ark/products/203891/intel-core-i5-10500te-processor-12m-cache-up-to-3-70-ghz.html) | +| CPU Price/socket on June 21, 2021, USD
Prices may vary | [117](https://ark.intel.com/content/www/us/en/ark/products/126688/intel-core-i3-8100-processor-6m-cache-3-60-ghz.html) | [192](https://ark.intel.com/content/www/us/en/ark/products/129939/intel-core-i5-8500-processor-9m-cache-up-to-4-10-ghz.html) | [195](https://ark.intel.com/content/www/us/en/ark/products/203891/intel-core-i5-10500te-processor-12m-cache-up-to-3-70-ghz.html) | **CPU Inference Engines (continue)** -| | Intel Atom® x5-E3940 | Intel Atom® x6425RE | Intel® Core™ i3-8100 | -| -------------------- | --------------------------------------|------------------------------- |----------------------------------- | -| Motherboard | | Intel Corporation /
ElkhartLake LPDDR4x T3 CRB | GIGABYTE* Z390 UD | -| CPU | Intel Atom® Processor E3940 @ 1.60GHz | Intel Atom® x6425RE
Processor @ 1.90GHz | Intel® Core™ i3-8100 CPU @ 3.60GHz | -| Hyper Threading | OFF | OFF | OFF | -| Turbo Setting | ON | ON | OFF | -| Memory | 1 x 8 GB DDR3 1600MHz | 2 x 4GB DDR4 3200 MHz | 4 x 8 GB DDR4 2400MHz | -| Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | -| Kernel Version | 5.3.0-24-generic | 5.8.0-050800-generic | 5.3.0-24-generic | -| BIOS Vendor | American Megatrends Inc.* | Intel Corporation | American Megatrends Inc.* | -| BIOS Version | 5.12 | EHLSFWI1.R00.2463.
A03.2011200425 | F8 | -| BIOS Release | September 6, 2017 | November 22, 2020 | May 24, 2019 | -| BIOS Settings | Default settings | Default settings | Select optimized default settings,
set OS type to "other",
save & exit | -| Batch size | 1 | 1 | 1 | -| Precision | INT8 | INT8 | INT8 | -| Number of concurrent inference requests | 4 | 4 | 4 | -| Test Date | March 15, 2021 | March 15, 2021 | March 15, 2021 | -| Power dissipation, TDP in Watt | [9.5](https://ark.intel.com/content/www/us/en/ark/products/96485/intel-atom-x5-e3940-processor-2m-cache-up-to-1-80-ghz.html) | [12](https://ark.intel.com/content/www/us/en/ark/products/207899/intel-atom-x6425re-processor-1-5m-cache-1-90-ghz.html) | [65](https://ark.intel.com/content/www/us/en/ark/products/126688/intel-core-i3-8100-processor-6m-cache-3-60-ghz.html#tab-blade-1-0-1)| -| CPU Price, USD
Prices may vary | [34](https://ark.intel.com/content/www/us/en/ark/products/96485/intel-atom-x5-e3940-processor-2m-cache-up-to-1-80-ghz.html) (on March 15th, 2021) | [59](https://ark.intel.com/content/www/us/en/ark/products/207899/intel-atom-x6425re-processor-1-5m-cache-1-90-ghz.html) (on March 26th, 2021) | [117](https://ark.intel.com/content/www/us/en/ark/products/126688/intel-core-i3-8100-processor-6m-cache-3-60-ghz.html) (on March 15th, 2021) | +| | Intel Atom® x5-E3940 | Intel Atom® x6425RE | Intel® Celeron® 6305E | +| -------------------- | --------------------------------------|------------------------------- |----------------------------------| +| Motherboard | Intel Corporation
internal/Reference
Validation Platform | Intel Corporation
internal/Reference
Validation Platform | Intel Corporation
internal/Reference
Validation Platform | +| CPU | Intel Atom® Processor E3940 @ 1.60GHz | Intel Atom® x6425RE
Processor @ 1.90GHz | Intel® Celeron®
6305E @ 1.80GHz | +| Hyper Threading | OFF | OFF | OFF | +| Turbo Setting | ON | ON | ON | +| Memory | 1 x 8 GB DDR3 1600MHz | 2 x 4GB DDR4 3200MHz | 2 x 8 GB DDR4 3200MHz | +| Operating System | Ubuntu* 18.04 LTS | Ubuntu* 18.04 LTS | Ubuntu 18.04.5 LTS | +| Kernel Version | 5.3.0-24-generic | 5.8.0-050800-generic | 5.8.0-050800-generic | +| BIOS Vendor | American Megatrends Inc.* | Intel Corporation | Intel Corporation | +| BIOS Version | 5.12 | EHLSFWI1.R00.2463.
A03.2011200425 | TGLIFUI1.R00.4064.A02.2102260133 | +| BIOS Release | September 6, 2017 | November 22, 2020 | February 26, 2021 | +| BIOS Settings | Default settings | Default settings | Default settings | +| Batch size | 1 | 1 | 1 | +| Precision | INT8 | INT8 | INT8 | +| Number of concurrent inference requests | 4 | 4 | 4| +| Test Date | June 18, 2021 | June 18, 2021 | June 18, 2021 | +| Rated maximum TDP/socket in Watt | [9.5](https://ark.intel.com/content/www/us/en/ark/products/96485/intel-atom-x5-e3940-processor-2m-cache-up-to-1-80-ghz.html) | [12](https://ark.intel.com/content/www/us/en/ark/products/207899/intel-atom-x6425re-processor-1-5m-cache-1-90-ghz.html) | [15](https://ark.intel.com/content/www/us/en/ark/products/208072/intel-celeron-6305e-processor-4m-cache-1-80-ghz.html)| +| CPU Price/socket on June 21, 2021, USD
Prices may vary | [34](https://ark.intel.com/content/www/us/en/ark/products/96485/intel-atom-x5-e3940-processor-2m-cache-up-to-1-80-ghz.html) | [59](https://ark.intel.com/content/www/us/en/ark/products/207899/intel-atom-x6425re-processor-1-5m-cache-1-90-ghz.html) |[107](https://ark.intel.com/content/www/us/en/ark/products/208072/intel-celeron-6305e-processor-4m-cache-1-80-ghz.html) | @@ -239,8 +264,8 @@ Testing by Intel done on: see test date for each HW platform below. | Batch size | 1 | 1 | | Precision | FP16 | FP16 | | Number of concurrent inference requests | 4 | 32 | -| Power dissipation, TDP in Watt | 2.5 | [30](https://www.arrow.com/en/products/mustang-v100-mx8-r10/iei-technology?gclid=Cj0KCQiA5bz-BRD-ARIsABjT4ng1v1apmxz3BVCPA-tdIsOwbEjTtqnmp_rQJGMfJ6Q2xTq6ADtf9OYaAhMUEALw_wcB) | -| CPU Price, USD
Prices may vary | [69](https://ark.intel.com/content/www/us/en/ark/products/140109/intel-neural-compute-stick-2.html) (from March 15, 2021) | [1180](https://www.arrow.com/en/products/mustang-v100-mx8-r10/iei-technology?gclid=Cj0KCQiA5bz-BRD-ARIsABjT4ng1v1apmxz3BVCPA-tdIsOwbEjTtqnmp_rQJGMfJ6Q2xTq6ADtf9OYaAhMUEALw_wcB) (from March 15, 2021) | +| Rated maximum TDP/socket in Watt | 2.5 | [30](https://www.arrow.com/en/products/mustang-v100-mx8-r10/iei-technology?gclid=Cj0KCQiA5bz-BRD-ARIsABjT4ng1v1apmxz3BVCPA-tdIsOwbEjTtqnmp_rQJGMfJ6Q2xTq6ADtf9OYaAhMUEALw_wcB) | +| CPU Price/socket on June 21, 2021, USD
Prices may vary | [69](https://ark.intel.com/content/www/us/en/ark/products/140109/intel-neural-compute-stick-2.html) | [425](https://www.arrow.com/en/products/mustang-v100-mx8-r10/iei-technology?gclid=Cj0KCQiA5bz-BRD-ARIsABjT4ng1v1apmxz3BVCPA-tdIsOwbEjTtqnmp_rQJGMfJ6Q2xTq6ADtf9OYaAhMUEALw_wcB) | | Host Computer | Intel® Core™ i7 | Intel® Core™ i5 | | Motherboard | ASUS* Z370-A II | Uzelinfo* / US-E1300 | | CPU | Intel® Core™ i7-8700 CPU @ 3.20GHz | Intel® Core™ i5-6600 CPU @ 3.30GHz | @@ -252,9 +277,9 @@ Testing by Intel done on: see test date for each HW platform below. | BIOS Vendor | American Megatrends Inc.* | American Megatrends Inc.* | | BIOS Version | 411 | 5.12 | | BIOS Release | September 21, 2018 | September 21, 2018 | -| Test Date | March 15, 2021 | March 15, 2021 | +| Test Date | June 18, 2021 | June 18, 2021 | -Please follow this link for more detailed configuration descriptions: [Configuration Details](https://docs.openvinotoolkit.org/resources/benchmark_files/system_configurations_2021.3.html) +Please follow this link for more detailed configuration descriptions: [Configuration Details](https://docs.openvinotoolkit.org/resources/benchmark_files/system_configurations_2021.4.html) \htmlonly